diff --git "a/wandb/run-20220301_082052-1y1by2yf/files/wandb-summary.json" "b/wandb/run-20220301_082052-1y1by2yf/files/wandb-summary.json" --- "a/wandb/run-20220301_082052-1y1by2yf/files/wandb-summary.json" +++ "b/wandb/run-20220301_082052-1y1by2yf/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.4804, "train/learning_rate": 8.403483309143687e-06, "train/epoch": 0.84, "train/global_step": 1000, "_runtime": 5811, "_timestamp": 1646128663, "_step": 1001, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 70.0, 942.0, 4.0, 1.0], "bins": [-1010.7235107421875, -994.23681640625, -977.7501220703125, -961.263427734375, -944.7767333984375, -928.2900390625, -911.8033447265625, -895.316650390625, -878.8299560546875, -862.34326171875, -845.8565673828125, -829.369873046875, -812.8831787109375, -796.396484375, -779.9097900390625, -763.423095703125, -746.9364013671875, -730.44970703125, -713.9630126953125, -697.476318359375, -680.9896240234375, -664.5029296875, -648.0162353515625, -631.529541015625, -615.0429077148438, -598.5562133789062, -582.0695190429688, -565.5828247070312, -549.0961303710938, -532.6094360351562, -516.1227416992188, -499.63604736328125, -483.1492919921875, -466.66259765625, -450.1759033203125, -433.689208984375, -417.2025146484375, -400.7158203125, -384.2291259765625, -367.742431640625, -351.2557678222656, -334.7690734863281, -318.2823791503906, -301.7956848144531, -285.3089904785156, -268.8222961425781, -252.3356170654297, -235.8489227294922, -219.3622283935547, -202.8755340576172, -186.3888397216797, -169.90216064453125, -153.41546630859375, -136.92877197265625, -120.44207763671875, -103.95538330078125, -87.46868896484375, -70.98199462890625, -54.495304107666016, -38.00861358642578, -21.52191925048828, -5.035224914550781, 11.451461791992188, 27.938156127929688, 44.42485427856445]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 8.0, 7.0, 12.0, 15.0, 13.0, 27.0, 33.0, 36.0, 44.0, 59.0, 52.0, 54.0, 74.0, 68.0, 69.0, 71.0, 83.0, 52.0, 68.0, 43.0, 31.0, 28.0, 16.0, 8.0, 16.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.25445556640625, -85.712890625, -83.17133331298828, -80.62977600097656, -78.08821105957031, -75.54664611816406, -73.00508880615234, -70.46353149414062, -67.92196655273438, -65.38040161132812, -62.838844299316406, -60.29728317260742, -57.75572204589844, -55.21416091918945, -52.67259979248047, -50.131038665771484, -47.5894775390625, -45.047916412353516, -42.50635528564453, -39.96479415893555, -37.42323303222656, -34.88167190551758, -32.340110778808594, -29.79854965209961, -27.256988525390625, -24.71542739868164, -22.173866271972656, -19.632305145263672, -17.090744018554688, -14.549182891845703, -12.007621765136719, -9.466060638427734, -6.92449951171875, -4.382938385009766, -1.8413772583007812, 0.7001838684082031, 3.2417449951171875, 5.783306121826172, 8.324867248535156, 10.86642837524414, 13.407989501953125, 15.94955062866211, 18.491111755371094, 21.032672882080078, 23.574234008789062, 26.115795135498047, 28.65735626220703, 31.198917388916016, 33.740478515625, 36.282039642333984, 38.82360076904297, 41.36516189575195, 43.90672302246094, 46.44828414916992, 48.989845275878906, 51.53140640258789, 54.072967529296875, 56.61452865600586, 59.156089782714844, 61.69765090942383, 64.23921203613281, 66.78077697753906, 69.32233428955078, 71.8638916015625, 74.40545654296875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 6.0, 6.0, 6.0, 10.0, 8.0, 11.0, 24.0, 23.0, 24.0, 26.0, 30.0, 30.0, 29.0, 35.0, 40.0, 49.0, 40.0, 44.0, 56.0, 33.0, 58.0, 48.0, 52.0, 46.0, 43.0, 38.0, 34.0, 34.0, 22.0, 23.0, 16.0, 16.0, 13.0, 10.0, 6.0, 4.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.740234375, -2.645721435546875, -2.55120849609375, -2.456695556640625, -2.3621826171875, -2.267669677734375, -2.17315673828125, -2.078643798828125, -1.984130859375, -1.889617919921875, -1.79510498046875, -1.700592041015625, -1.6060791015625, -1.511566162109375, -1.41705322265625, -1.322540283203125, -1.22802734375, -1.133514404296875, -1.03900146484375, -0.944488525390625, -0.8499755859375, -0.755462646484375, -0.66094970703125, -0.566436767578125, -0.471923828125, -0.377410888671875, -0.28289794921875, -0.188385009765625, -0.0938720703125, 0.000640869140625, 0.09515380859375, 0.189666748046875, 0.2841796875, 0.378692626953125, 0.47320556640625, 0.567718505859375, 0.6622314453125, 0.756744384765625, 0.85125732421875, 0.945770263671875, 1.040283203125, 1.134796142578125, 1.22930908203125, 1.323822021484375, 1.4183349609375, 1.512847900390625, 1.60736083984375, 1.701873779296875, 1.79638671875, 1.890899658203125, 1.98541259765625, 2.079925537109375, 2.1744384765625, 2.268951416015625, 2.36346435546875, 2.457977294921875, 2.552490234375, 2.647003173828125, 2.74151611328125, 2.836029052734375, 2.9305419921875, 3.025054931640625, 3.11956787109375, 3.214080810546875, 3.30859375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 9.0, 6.0, 14.0, 15.0, 15.0, 18.0, 37.0, 53.0, 67.0, 83.0, 139.0, 161.0, 242.0, 379.0, 597.0, 1060.0, 1913.0, 3964.0, 9416.0, 28342.0, 137510.0, 1417279.0, 2290309.0, 239549.0, 40803.0, 12052.0, 4796.0, 2235.0, 1185.0, 687.0, 427.0, 259.0, 184.0, 129.0, 92.0, 63.0, 62.0, 31.0, 24.0, 18.0, 11.0, 16.0, 6.0, 8.0, 8.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.265625, -9.9461669921875, -9.626708984375, -9.3072509765625, -8.98779296875, -8.6683349609375, -8.348876953125, -8.0294189453125, -7.7099609375, -7.3905029296875, -7.071044921875, -6.7515869140625, -6.43212890625, -6.1126708984375, -5.793212890625, -5.4737548828125, -5.154296875, -4.8348388671875, -4.515380859375, -4.1959228515625, -3.87646484375, -3.5570068359375, -3.237548828125, -2.9180908203125, -2.5986328125, -2.2791748046875, -1.959716796875, -1.6402587890625, -1.32080078125, -1.0013427734375, -0.681884765625, -0.3624267578125, -0.04296875, 0.2764892578125, 0.595947265625, 0.9154052734375, 1.23486328125, 1.5543212890625, 1.873779296875, 2.1932373046875, 2.5126953125, 2.8321533203125, 3.151611328125, 3.4710693359375, 3.79052734375, 4.1099853515625, 4.429443359375, 4.7489013671875, 5.068359375, 5.3878173828125, 5.707275390625, 6.0267333984375, 6.34619140625, 6.6656494140625, 6.985107421875, 7.3045654296875, 7.6240234375, 7.9434814453125, 8.262939453125, 8.5823974609375, 8.90185546875, 9.2213134765625, 9.540771484375, 9.8602294921875, 10.1796875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 10.0, 22.0, 31.0, 91.0, 197.0, 331.0, 726.0, 1163.0, 766.0, 393.0, 185.0, 85.0, 42.0, 16.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.828125, -31.024169921875, -30.22021484375, -29.416259765625, -28.6123046875, -27.808349609375, -27.00439453125, -26.200439453125, -25.396484375, -24.592529296875, -23.78857421875, -22.984619140625, -22.1806640625, -21.376708984375, -20.57275390625, -19.768798828125, -18.96484375, -18.160888671875, -17.35693359375, -16.552978515625, -15.7490234375, -14.945068359375, -14.14111328125, -13.337158203125, -12.533203125, -11.729248046875, -10.92529296875, -10.121337890625, -9.3173828125, -8.513427734375, -7.70947265625, -6.905517578125, -6.1015625, -5.297607421875, -4.49365234375, -3.689697265625, -2.8857421875, -2.081787109375, -1.27783203125, -0.473876953125, 0.330078125, 1.134033203125, 1.93798828125, 2.741943359375, 3.5458984375, 4.349853515625, 5.15380859375, 5.957763671875, 6.76171875, 7.565673828125, 8.36962890625, 9.173583984375, 9.9775390625, 10.781494140625, 11.58544921875, 12.389404296875, 13.193359375, 13.997314453125, 14.80126953125, 15.605224609375, 16.4091796875, 17.213134765625, 18.01708984375, 18.821044921875, 19.625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 16.0, 14.0, 18.0, 63.0, 170.0, 428.0, 1179.0, 5299.0, 3992841.0, 190540.0, 2456.0, 776.0, 264.0, 118.0, 43.0, 20.0, 10.0, 8.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.1875, -91.4013671875, -88.615234375, -85.8291015625, -83.04296875, -80.2568359375, -77.470703125, -74.6845703125, -71.8984375, -69.1123046875, -66.326171875, -63.5400390625, -60.75390625, -57.9677734375, -55.181640625, -52.3955078125, -49.609375, -46.8232421875, -44.037109375, -41.2509765625, -38.46484375, -35.6787109375, -32.892578125, -30.1064453125, -27.3203125, -24.5341796875, -21.748046875, -18.9619140625, -16.17578125, -13.3896484375, -10.603515625, -7.8173828125, -5.03125, -2.2451171875, 0.541015625, 3.3271484375, 6.11328125, 8.8994140625, 11.685546875, 14.4716796875, 17.2578125, 20.0439453125, 22.830078125, 25.6162109375, 28.40234375, 31.1884765625, 33.974609375, 36.7607421875, 39.546875, 42.3330078125, 45.119140625, 47.9052734375, 50.69140625, 53.4775390625, 56.263671875, 59.0498046875, 61.8359375, 64.6220703125, 67.408203125, 70.1943359375, 72.98046875, 75.7666015625, 78.552734375, 81.3388671875, 84.125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [16.0, 667.0, 329.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.600341796875, -8.848542213439941, 0.9032573699951172, 10.65505599975586, 20.406856536865234, 30.15865707397461, 39.91045379638672, 49.662254333496094, 59.41405487060547, 69.16585540771484, 78.91765594482422, 88.66944885253906, 98.42124938964844, 108.17304992675781, 117.92485046386719, 127.67665100097656, 137.42845153808594, 147.1802520751953, 156.9320526123047, 166.68385314941406, 176.43565368652344, 186.1874542236328, 195.93923950195312, 205.6910400390625, 215.44284057617188, 225.19464111328125, 234.94644165039062, 244.6982421875, 254.45004272460938, 264.20184326171875, 273.9536437988281, 283.7054443359375, 293.4572448730469, 303.20904541015625, 312.9608459472656, 322.712646484375, 332.4644470214844, 342.21624755859375, 351.9680480957031, 361.7198486328125, 371.4716491699219, 381.22344970703125, 390.9752502441406, 400.72705078125, 410.4788513183594, 420.23065185546875, 429.9824523925781, 439.7342529296875, 449.48602294921875, 459.2378234863281, 468.9896240234375, 478.7414245605469, 488.49322509765625, 498.2450256347656, 507.996826171875, 517.7485961914062, 527.5004272460938, 537.252197265625, 547.0040283203125, 556.7557983398438, 566.5076293945312, 576.2593994140625, 586.01123046875, 595.7630004882812, 605.5148315429688]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 1.0, 5.0, 7.0, 6.0, 11.0, 15.0, 14.0, 27.0, 27.0, 24.0, 29.0, 41.0, 31.0, 40.0, 43.0, 48.0, 45.0, 52.0, 43.0, 38.0, 42.0, 42.0, 61.0, 31.0, 37.0, 38.0, 43.0, 24.0, 22.0, 17.0, 22.0, 11.0, 10.0, 12.0, 11.0, 9.0, 4.0, 8.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.319793701171875, -43.89503860473633, -42.47028350830078, -41.0455322265625, -39.62077713012695, -38.196022033691406, -36.771270751953125, -35.34651565551758, -33.92176055908203, -32.497005462646484, -31.07225227355957, -29.647499084472656, -28.22274398803711, -26.797988891601562, -25.37323570251465, -23.948482513427734, -22.523727416992188, -21.09897232055664, -19.674219131469727, -18.249465942382812, -16.824710845947266, -15.399956703186035, -13.975202560424805, -12.550448417663574, -11.125694274902344, -9.700940132141113, -8.276185989379883, -6.851431846618652, -5.426677703857422, -4.001923561096191, -2.577169418334961, -1.1524152755737305, 0.2723388671875, 1.6970930099487305, 3.121847152709961, 4.546601295471191, 5.971355438232422, 7.396109580993652, 8.820863723754883, 10.245617866516113, 11.670372009277344, 13.095126152038574, 14.519880294799805, 15.944634437561035, 17.369388580322266, 18.794143676757812, 20.218896865844727, 21.64365005493164, 23.068405151367188, 24.493160247802734, 25.91791343688965, 27.342666625976562, 28.76742172241211, 30.192176818847656, 31.61693000793457, 33.041683197021484, 34.46643829345703, 35.89119338989258, 37.315948486328125, 38.740699768066406, 40.16545486450195, 41.5902099609375, 43.01496124267578, 44.43971633911133, 45.864471435546875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 10.0, 8.0, 12.0, 14.0, 16.0, 19.0, 6.0, 20.0, 20.0, 24.0, 21.0, 27.0, 27.0, 27.0, 34.0, 33.0, 49.0, 49.0, 39.0, 46.0, 38.0, 38.0, 47.0, 35.0, 31.0, 31.0, 26.0, 42.0, 31.0, 30.0, 25.0, 25.0, 14.0, 15.0, 12.0, 12.0, 9.0, 7.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.80078125, -2.717620849609375, -2.63446044921875, -2.551300048828125, -2.4681396484375, -2.384979248046875, -2.30181884765625, -2.218658447265625, -2.135498046875, -2.052337646484375, -1.96917724609375, -1.886016845703125, -1.8028564453125, -1.719696044921875, -1.63653564453125, -1.553375244140625, -1.47021484375, -1.387054443359375, -1.30389404296875, -1.220733642578125, -1.1375732421875, -1.054412841796875, -0.97125244140625, -0.888092041015625, -0.804931640625, -0.721771240234375, -0.63861083984375, -0.555450439453125, -0.4722900390625, -0.389129638671875, -0.30596923828125, -0.222808837890625, -0.1396484375, -0.056488037109375, 0.02667236328125, 0.109832763671875, 0.1929931640625, 0.276153564453125, 0.35931396484375, 0.442474365234375, 0.525634765625, 0.608795166015625, 0.69195556640625, 0.775115966796875, 0.8582763671875, 0.941436767578125, 1.02459716796875, 1.107757568359375, 1.19091796875, 1.274078369140625, 1.35723876953125, 1.440399169921875, 1.5235595703125, 1.606719970703125, 1.68988037109375, 1.773040771484375, 1.856201171875, 1.939361572265625, 2.02252197265625, 2.105682373046875, 2.1888427734375, 2.272003173828125, 2.35516357421875, 2.438323974609375, 2.521484375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 12.0, 22.0, 20.0, 38.0, 54.0, 86.0, 111.0, 185.0, 245.0, 353.0, 535.0, 776.0, 1130.0, 1632.0, 2470.0, 3559.0, 5528.0, 8482.0, 13039.0, 20233.0, 32698.0, 54002.0, 89584.0, 143711.0, 196412.0, 172581.0, 115594.0, 69889.0, 42308.0, 25868.0, 16247.0, 10269.0, 7023.0, 4536.0, 2999.0, 1964.0, 1356.0, 948.0, 687.0, 440.0, 301.0, 198.0, 137.0, 93.0, 60.0, 50.0, 35.0, 19.0, 11.0, 10.0, 12.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.306884765625, -0.297515869140625, -0.28814697265625, -0.278778076171875, -0.2694091796875, -0.260040283203125, -0.25067138671875, -0.241302490234375, -0.23193359375, -0.222564697265625, -0.21319580078125, -0.203826904296875, -0.1944580078125, -0.185089111328125, -0.17572021484375, -0.166351318359375, -0.156982421875, -0.147613525390625, -0.13824462890625, -0.128875732421875, -0.1195068359375, -0.110137939453125, -0.10076904296875, -0.091400146484375, -0.08203125, -0.072662353515625, -0.06329345703125, -0.053924560546875, -0.0445556640625, -0.035186767578125, -0.02581787109375, -0.016448974609375, -0.007080078125, 0.002288818359375, 0.01165771484375, 0.021026611328125, 0.0303955078125, 0.039764404296875, 0.04913330078125, 0.058502197265625, 0.06787109375, 0.077239990234375, 0.08660888671875, 0.095977783203125, 0.1053466796875, 0.114715576171875, 0.12408447265625, 0.133453369140625, 0.142822265625, 0.152191162109375, 0.16156005859375, 0.170928955078125, 0.1802978515625, 0.189666748046875, 0.19903564453125, 0.208404541015625, 0.2177734375, 0.227142333984375, 0.23651123046875, 0.245880126953125, 0.2552490234375, 0.264617919921875, 0.27398681640625, 0.283355712890625, 0.292724609375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 2.0, 1.0, 6.0, 7.0, 12.0, 9.0, 9.0, 11.0, 13.0, 18.0, 25.0, 17.0, 17.0, 22.0, 29.0, 28.0, 31.0, 30.0, 33.0, 29.0, 39.0, 37.0, 35.0, 1072.0, 30.0, 36.0, 28.0, 44.0, 43.0, 38.0, 35.0, 27.0, 24.0, 25.0, 22.0, 13.0, 25.0, 18.0, 16.0, 18.0, 8.0, 6.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0], "bins": [-1.7138671875, -1.663970947265625, -1.61407470703125, -1.564178466796875, -1.5142822265625, -1.464385986328125, -1.41448974609375, -1.364593505859375, -1.314697265625, -1.264801025390625, -1.21490478515625, -1.165008544921875, -1.1151123046875, -1.065216064453125, -1.01531982421875, -0.965423583984375, -0.91552734375, -0.865631103515625, -0.81573486328125, -0.765838623046875, -0.7159423828125, -0.666046142578125, -0.61614990234375, -0.566253662109375, -0.516357421875, -0.466461181640625, -0.41656494140625, -0.366668701171875, -0.3167724609375, -0.266876220703125, -0.21697998046875, -0.167083740234375, -0.1171875, -0.067291259765625, -0.01739501953125, 0.032501220703125, 0.0823974609375, 0.132293701171875, 0.18218994140625, 0.232086181640625, 0.281982421875, 0.331878662109375, 0.38177490234375, 0.431671142578125, 0.4815673828125, 0.531463623046875, 0.58135986328125, 0.631256103515625, 0.68115234375, 0.731048583984375, 0.78094482421875, 0.830841064453125, 0.8807373046875, 0.930633544921875, 0.98052978515625, 1.030426025390625, 1.080322265625, 1.130218505859375, 1.18011474609375, 1.230010986328125, 1.2799072265625, 1.329803466796875, 1.37969970703125, 1.429595947265625, 1.4794921875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 11.0, 5.0, 21.0, 23.0, 36.0, 81.0, 95.0, 150.0, 217.0, 381.0, 587.0, 937.0, 1472.0, 2550.0, 4038.0, 6875.0, 11920.0, 20571.0, 35461.0, 64655.0, 112891.0, 176343.0, 1256137.0, 164676.0, 102401.0, 57449.0, 31951.0, 18485.0, 10683.0, 6339.0, 3710.0, 2318.0, 1384.0, 833.0, 499.0, 331.0, 224.0, 146.0, 85.0, 57.0, 38.0, 21.0, 17.0, 8.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.266357421875, -0.25838470458984375, -0.2504119873046875, -0.24243927001953125, -0.234466552734375, -0.22649383544921875, -0.2185211181640625, -0.21054840087890625, -0.20257568359375, -0.19460296630859375, -0.1866302490234375, -0.17865753173828125, -0.170684814453125, -0.16271209716796875, -0.1547393798828125, -0.14676666259765625, -0.1387939453125, -0.13082122802734375, -0.1228485107421875, -0.11487579345703125, -0.106903076171875, -0.09893035888671875, -0.0909576416015625, -0.08298492431640625, -0.07501220703125, -0.06703948974609375, -0.0590667724609375, -0.05109405517578125, -0.043121337890625, -0.03514862060546875, -0.0271759033203125, -0.01920318603515625, -0.01123046875, -0.00325775146484375, 0.0047149658203125, 0.01268768310546875, 0.020660400390625, 0.02863311767578125, 0.0366058349609375, 0.04457855224609375, 0.05255126953125, 0.06052398681640625, 0.0684967041015625, 0.07646942138671875, 0.084442138671875, 0.09241485595703125, 0.1003875732421875, 0.10836029052734375, 0.1163330078125, 0.12430572509765625, 0.1322784423828125, 0.14025115966796875, 0.148223876953125, 0.15619659423828125, 0.1641693115234375, 0.17214202880859375, 0.18011474609375, 0.18808746337890625, 0.1960601806640625, 0.20403289794921875, 0.212005615234375, 0.21997833251953125, 0.2279510498046875, 0.23592376708984375, 0.243896484375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 6.0, 3.0, 4.0, 8.0, 7.0, 8.0, 15.0, 12.0, 15.0, 28.0, 22.0, 25.0, 34.0, 41.0, 31.0, 48.0, 45.0, 40.0, 55.0, 54.0, 57.0, 50.0, 53.0, 42.0, 34.0, 48.0, 41.0, 30.0, 28.0, 19.0, 25.0, 16.0, 7.0, 9.0, 10.0, 5.0, 15.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006809234619140625, -0.0006574913859367371, -0.0006340593099594116, -0.0006106272339820862, -0.0005871951580047607, -0.0005637630820274353, -0.0005403310060501099, -0.0005168989300727844, -0.000493466854095459, -0.00047003477811813354, -0.0004466027021408081, -0.00042317062616348267, -0.0003997385501861572, -0.0003763064742088318, -0.00035287439823150635, -0.0003294423222541809, -0.00030601024627685547, -0.00028257817029953003, -0.0002591460943222046, -0.00023571401834487915, -0.0002122819423675537, -0.00018884986639022827, -0.00016541779041290283, -0.0001419857144355774, -0.00011855363845825195, -9.512156248092651e-05, -7.168948650360107e-05, -4.8257410526275635e-05, -2.4825334548950195e-05, -1.3932585716247559e-06, 2.2038817405700684e-05, 4.547089338302612e-05, 6.890296936035156e-05, 9.2335045337677e-05, 0.00011576712131500244, 0.00013919919729232788, 0.00016263127326965332, 0.00018606334924697876, 0.0002094954252243042, 0.00023292750120162964, 0.0002563595771789551, 0.0002797916531562805, 0.00030322372913360596, 0.0003266558051109314, 0.00035008788108825684, 0.0003735199570655823, 0.0003969520330429077, 0.00042038410902023315, 0.0004438161849975586, 0.00046724826097488403, 0.0004906803369522095, 0.0005141124129295349, 0.0005375444889068604, 0.0005609765648841858, 0.0005844086408615112, 0.0006078407168388367, 0.0006312727928161621, 0.0006547048687934875, 0.000678136944770813, 0.0007015690207481384, 0.0007250010967254639, 0.0007484331727027893, 0.0007718652486801147, 0.0007952973246574402, 0.0008187294006347656]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 8.0, 5.0, 5.0, 6.0, 11.0, 12.0, 16.0, 14.0, 22.0, 26.0, 43.0, 59.0, 68.0, 72.0, 88.0, 107.0, 115.0, 175.0, 193.0, 302.0, 504.0, 1620.0, 976887.0, 65873.0, 757.0, 400.0, 248.0, 210.0, 142.0, 103.0, 100.0, 75.0, 59.0, 55.0, 36.0, 31.0, 23.0, 19.0, 21.0, 10.0, 9.0, 9.0, 12.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01454925537109375, -0.014105558395385742, -0.013661861419677734, -0.013218164443969727, -0.012774467468261719, -0.012330770492553711, -0.011887073516845703, -0.011443376541137695, -0.010999679565429688, -0.01055598258972168, -0.010112285614013672, -0.009668588638305664, -0.009224891662597656, -0.008781194686889648, -0.00833749771118164, -0.007893800735473633, -0.007450103759765625, -0.007006406784057617, -0.006562709808349609, -0.0061190128326416016, -0.005675315856933594, -0.005231618881225586, -0.004787921905517578, -0.00434422492980957, -0.0039005279541015625, -0.0034568309783935547, -0.003013134002685547, -0.002569437026977539, -0.0021257400512695312, -0.0016820430755615234, -0.0012383460998535156, -0.0007946491241455078, -0.0003509521484375, 9.274482727050781e-05, 0.0005364418029785156, 0.0009801387786865234, 0.0014238357543945312, 0.001867532730102539, 0.002311229705810547, 0.0027549266815185547, 0.0031986236572265625, 0.0036423206329345703, 0.004086017608642578, 0.004529714584350586, 0.004973411560058594, 0.0054171085357666016, 0.005860805511474609, 0.006304502487182617, 0.006748199462890625, 0.007191896438598633, 0.007635593414306641, 0.008079290390014648, 0.008522987365722656, 0.008966684341430664, 0.009410381317138672, 0.00985407829284668, 0.010297775268554688, 0.010741472244262695, 0.011185169219970703, 0.011628866195678711, 0.012072563171386719, 0.012516260147094727, 0.012959957122802734, 0.013403654098510742, 0.01384735107421875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 24.0, 606.0, 374.0, 9.0, 2.0, 2.0, 1.0], "bins": [-0.0055391015484929085, -0.005445042159408331, -0.005350982770323753, -0.005256923381239176, -0.005162863992154598, -0.005068804137408733, -0.004974744748324156, -0.004880685359239578, -0.004786625970155001, -0.004692566581070423, -0.0045985071919858456, -0.004504447802901268, -0.0044103884138166904, -0.004316328559070826, -0.004222269169986248, -0.0041282097809016705, -0.004034150391817093, -0.003940091002732515, -0.0038460316136479378, -0.0037519719917327166, -0.003657912602648139, -0.0035638532135635614, -0.003469793824478984, -0.0033757342025637627, -0.0032816750463098288, -0.003187615657225251, -0.0030935562681406736, -0.0029994966462254524, -0.002905437257140875, -0.0028113778680562973, -0.0027173184789717197, -0.002623259089887142, -0.002529199467971921, -0.0024351400788873434, -0.002341080689802766, -0.0022470210678875446, -0.002152961678802967, -0.0020589022897183895, -0.001964842900633812, -0.0018707833951339126, -0.001776724006049335, -0.0016826646169647574, -0.001588605111464858, -0.0014945457223802805, -0.001400486216880381, -0.0013064268277958035, -0.0012123673222959042, -0.0011183079332113266, -0.0010242484277114272, -0.0009301889804191887, -0.0008361295331269503, -0.0007420701440423727, -0.0006480106385424733, -0.0005539512494578958, -0.0004598918021656573, -0.0003658323548734188, -0.0002717729366850108, -0.00017771348939277232, -8.365405665244907e-05, 1.0405376087874174e-05, 0.00010446482338011265, 0.00019852427067235112, 0.00029258368886075914, 0.0003866431361529976, 0.0004807025834452361]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 5.0, 11.0, 9.0, 10.0, 15.0, 9.0, 15.0, 17.0, 27.0, 21.0, 27.0, 38.0, 38.0, 40.0, 37.0, 44.0, 36.0, 56.0, 43.0, 45.0, 53.0, 48.0, 41.0, 36.0, 36.0, 35.0, 28.0, 35.0, 17.0, 22.0, 17.0, 16.0, 9.0, 15.0, 12.0, 7.0, 7.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00046753883361816406, -0.0004540616646409035, -0.0004405844956636429, -0.0004271073266863823, -0.0004136301577091217, -0.0004001529887318611, -0.0003866758197546005, -0.00037319865077733994, -0.00035972148180007935, -0.00034624431282281876, -0.00033276714384555817, -0.0003192899748682976, -0.000305812805891037, -0.0002923356369137764, -0.0002788584679365158, -0.0002653812989592552, -0.00025190412998199463, -0.00023842696100473404, -0.00022494979202747345, -0.00021147262305021286, -0.00019799545407295227, -0.00018451828509569168, -0.0001710411161184311, -0.0001575639471411705, -0.0001440867781639099, -0.00013060960918664932, -0.00011713244020938873, -0.00010365527123212814, -9.017810225486755e-05, -7.670093327760696e-05, -6.322376430034637e-05, -4.9746595323085785e-05, -3.6269426345825195e-05, -2.2792257368564606e-05, -9.315088391304016e-06, 4.1620805859565735e-06, 1.7639249563217163e-05, 3.111641854047775e-05, 4.459358751773834e-05, 5.807075649499893e-05, 7.154792547225952e-05, 8.502509444952011e-05, 9.85022634267807e-05, 0.00011197943240404129, 0.00012545660138130188, 0.00013893377035856247, 0.00015241093933582306, 0.00016588810831308365, 0.00017936527729034424, 0.00019284244626760483, 0.00020631961524486542, 0.000219796784222126, 0.0002332739531993866, 0.0002467511221766472, 0.0002602282911539078, 0.00027370546013116837, 0.00028718262910842896, 0.00030065979808568954, 0.00031413696706295013, 0.0003276141360402107, 0.0003410913050174713, 0.0003545684739947319, 0.0003680456429719925, 0.0003815228119492531, 0.00039499998092651367]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 10.0, 8.0, 12.0, 14.0, 16.0, 19.0, 6.0, 20.0, 20.0, 24.0, 21.0, 27.0, 27.0, 27.0, 34.0, 33.0, 49.0, 49.0, 39.0, 46.0, 38.0, 38.0, 47.0, 35.0, 31.0, 31.0, 26.0, 42.0, 31.0, 30.0, 25.0, 25.0, 14.0, 15.0, 12.0, 12.0, 9.0, 7.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.80078125, -2.717620849609375, -2.63446044921875, -2.551300048828125, -2.4681396484375, -2.384979248046875, -2.30181884765625, -2.218658447265625, -2.135498046875, -2.052337646484375, -1.96917724609375, -1.886016845703125, -1.8028564453125, -1.719696044921875, -1.63653564453125, -1.553375244140625, -1.47021484375, -1.387054443359375, -1.30389404296875, -1.220733642578125, -1.1375732421875, -1.054412841796875, -0.97125244140625, -0.888092041015625, -0.804931640625, -0.721771240234375, -0.63861083984375, -0.555450439453125, -0.4722900390625, -0.389129638671875, -0.30596923828125, -0.222808837890625, -0.1396484375, -0.056488037109375, 0.02667236328125, 0.109832763671875, 0.1929931640625, 0.276153564453125, 0.35931396484375, 0.442474365234375, 0.525634765625, 0.608795166015625, 0.69195556640625, 0.775115966796875, 0.8582763671875, 0.941436767578125, 1.02459716796875, 1.107757568359375, 1.19091796875, 1.274078369140625, 1.35723876953125, 1.440399169921875, 1.5235595703125, 1.606719970703125, 1.68988037109375, 1.773040771484375, 1.856201171875, 1.939361572265625, 2.02252197265625, 2.105682373046875, 2.1888427734375, 2.272003173828125, 2.35516357421875, 2.438323974609375, 2.521484375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 11.0, 9.0, 21.0, 27.0, 23.0, 51.0, 48.0, 66.0, 75.0, 118.0, 137.0, 205.0, 289.0, 369.0, 518.0, 704.0, 1015.0, 1360.0, 2194.0, 3378.0, 5427.0, 9746.0, 19933.0, 83465.0, 716898.0, 148796.0, 24586.0, 11022.0, 6254.0, 3825.0, 2416.0, 1666.0, 1110.0, 667.0, 532.0, 420.0, 292.0, 206.0, 162.0, 118.0, 96.0, 70.0, 62.0, 39.0, 26.0, 30.0, 18.0, 15.0, 12.0, 5.0, 7.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0], "bins": [-13.1171875, -12.7022705078125, -12.287353515625, -11.8724365234375, -11.45751953125, -11.0426025390625, -10.627685546875, -10.2127685546875, -9.7978515625, -9.3829345703125, -8.968017578125, -8.5531005859375, -8.13818359375, -7.7232666015625, -7.308349609375, -6.8934326171875, -6.478515625, -6.0635986328125, -5.648681640625, -5.2337646484375, -4.81884765625, -4.4039306640625, -3.989013671875, -3.5740966796875, -3.1591796875, -2.7442626953125, -2.329345703125, -1.9144287109375, -1.49951171875, -1.0845947265625, -0.669677734375, -0.2547607421875, 0.16015625, 0.5750732421875, 0.989990234375, 1.4049072265625, 1.81982421875, 2.2347412109375, 2.649658203125, 3.0645751953125, 3.4794921875, 3.8944091796875, 4.309326171875, 4.7242431640625, 5.13916015625, 5.5540771484375, 5.968994140625, 6.3839111328125, 6.798828125, 7.2137451171875, 7.628662109375, 8.0435791015625, 8.45849609375, 8.8734130859375, 9.288330078125, 9.7032470703125, 10.1181640625, 10.5330810546875, 10.947998046875, 11.3629150390625, 11.77783203125, 12.1927490234375, 12.607666015625, 13.0225830078125, 13.4375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 6.0, 7.0, 6.0, 7.0, 10.0, 12.0, 15.0, 27.0, 18.0, 29.0, 30.0, 31.0, 32.0, 31.0, 30.0, 43.0, 42.0, 69.0, 127.0, 311.0, 1490.0, 187.0, 100.0, 67.0, 38.0, 42.0, 33.0, 29.0, 20.0, 27.0, 22.0, 18.0, 18.0, 19.0, 10.0, 8.0, 10.0, 2.0, 10.0, 5.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.9609375, -8.68310546875, -8.4052734375, -8.12744140625, -7.849609375, -7.57177734375, -7.2939453125, -7.01611328125, -6.73828125, -6.46044921875, -6.1826171875, -5.90478515625, -5.626953125, -5.34912109375, -5.0712890625, -4.79345703125, -4.515625, -4.23779296875, -3.9599609375, -3.68212890625, -3.404296875, -3.12646484375, -2.8486328125, -2.57080078125, -2.29296875, -2.01513671875, -1.7373046875, -1.45947265625, -1.181640625, -0.90380859375, -0.6259765625, -0.34814453125, -0.0703125, 0.20751953125, 0.4853515625, 0.76318359375, 1.041015625, 1.31884765625, 1.5966796875, 1.87451171875, 2.15234375, 2.43017578125, 2.7080078125, 2.98583984375, 3.263671875, 3.54150390625, 3.8193359375, 4.09716796875, 4.375, 4.65283203125, 4.9306640625, 5.20849609375, 5.486328125, 5.76416015625, 6.0419921875, 6.31982421875, 6.59765625, 6.87548828125, 7.1533203125, 7.43115234375, 7.708984375, 7.98681640625, 8.2646484375, 8.54248046875, 8.8203125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 1.0, 3.0, 3.0, 1.0, 13.0, 6.0, 10.0, 11.0, 13.0, 15.0, 23.0, 23.0, 20.0, 19.0, 36.0, 38.0, 43.0, 77.0, 140.0, 389.0, 1828.0, 937768.0, 2202051.0, 2164.0, 420.0, 180.0, 67.0, 57.0, 40.0, 41.0, 30.0, 25.0, 32.0, 23.0, 15.0, 22.0, 10.0, 12.0, 10.0, 5.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-37.46875, -36.26123046875, -35.0537109375, -33.84619140625, -32.638671875, -31.43115234375, -30.2236328125, -29.01611328125, -27.80859375, -26.60107421875, -25.3935546875, -24.18603515625, -22.978515625, -21.77099609375, -20.5634765625, -19.35595703125, -18.1484375, -16.94091796875, -15.7333984375, -14.52587890625, -13.318359375, -12.11083984375, -10.9033203125, -9.69580078125, -8.48828125, -7.28076171875, -6.0732421875, -4.86572265625, -3.658203125, -2.45068359375, -1.2431640625, -0.03564453125, 1.171875, 2.37939453125, 3.5869140625, 4.79443359375, 6.001953125, 7.20947265625, 8.4169921875, 9.62451171875, 10.83203125, 12.03955078125, 13.2470703125, 14.45458984375, 15.662109375, 16.86962890625, 18.0771484375, 19.28466796875, 20.4921875, 21.69970703125, 22.9072265625, 24.11474609375, 25.322265625, 26.52978515625, 27.7373046875, 28.94482421875, 30.15234375, 31.35986328125, 32.5673828125, 33.77490234375, 34.982421875, 36.18994140625, 37.3974609375, 38.60498046875, 39.8125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 826.0, 191.0, 2.0, 1.0, 1.0], "bins": [-514.5261840820312, -505.9359130859375, -497.34564208984375, -488.75537109375, -480.16510009765625, -471.5748291015625, -462.98455810546875, -454.394287109375, -445.80401611328125, -437.2137451171875, -428.62347412109375, -420.033203125, -411.44293212890625, -402.8526611328125, -394.26239013671875, -385.672119140625, -377.0818176269531, -368.4915466308594, -359.9012756347656, -351.3110046386719, -342.7207336425781, -334.1304626464844, -325.5401916503906, -316.94989013671875, -308.359619140625, -299.76934814453125, -291.1790771484375, -282.58880615234375, -273.99853515625, -265.40826416015625, -256.8179931640625, -248.2277069091797, -239.637451171875, -231.04718017578125, -222.4569091796875, -213.86663818359375, -205.2763671875, -196.68609619140625, -188.09580993652344, -179.5055389404297, -170.91526794433594, -162.3249969482422, -153.73472595214844, -145.1444549560547, -136.55416870117188, -127.96390533447266, -119.37362670898438, -110.78335571289062, -102.19308471679688, -93.60281372070312, -85.01254272460938, -76.4222640991211, -67.83199310302734, -59.241722106933594, -50.65144729614258, -42.06117248535156, -33.47090530395508, -24.880632400512695, -16.290359497070312, -7.70008659362793, 0.8901863098144531, 9.480457305908203, 18.07073211669922, 26.661006927490234, 35.251277923583984]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 7.0, 10.0, 9.0, 6.0, 21.0, 17.0, 11.0, 15.0, 23.0, 30.0, 38.0, 42.0, 29.0, 47.0, 35.0, 39.0, 37.0, 44.0, 48.0, 41.0, 24.0, 42.0, 42.0, 47.0, 40.0, 37.0, 21.0, 32.0, 20.0, 25.0, 16.0, 22.0, 8.0, 16.0, 9.0, 10.0, 10.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.235851287841797, -29.38324546813965, -28.530641555786133, -27.678035736083984, -26.82543182373047, -25.97282600402832, -25.120220184326172, -24.267616271972656, -23.415010452270508, -22.56240463256836, -21.709800720214844, -20.857194900512695, -20.00459098815918, -19.15198516845703, -18.299381256103516, -17.446775436401367, -16.59416961669922, -15.741564750671387, -14.888959884643555, -14.036354064941406, -13.183749198913574, -12.331144332885742, -11.47853946685791, -10.625934600830078, -9.773330688476562, -8.92072582244873, -8.068120956420898, -7.215515613555908, -6.362910270690918, -5.510305404663086, -4.657700538635254, -3.8050951957702637, -2.9524898529052734, -2.0998847484588623, -1.2472797632217407, -0.39467477798461914, 0.457930326461792, 1.3105354309082031, 2.163140296936035, 3.0157456398010254, 3.8683505058288574, 4.7209553718566895, 5.57356071472168, 6.426165580749512, 7.278770446777344, 8.131376266479492, 8.983980178833008, 9.836585998535156, 10.689190864562988, 11.54179573059082, 12.394400596618652, 13.247005462646484, 14.099611282348633, 14.952216148376465, 15.804821014404297, 16.657426834106445, 17.51003074645996, 18.36263656616211, 19.215240478515625, 20.067846298217773, 20.92045021057129, 21.773056030273438, 22.625659942626953, 23.4782657623291, 24.33087158203125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 7.0, 8.0, 11.0, 14.0, 6.0, 12.0, 16.0, 18.0, 17.0, 14.0, 24.0, 26.0, 20.0, 30.0, 27.0, 36.0, 34.0, 42.0, 38.0, 59.0, 46.0, 46.0, 35.0, 37.0, 30.0, 29.0, 36.0, 38.0, 32.0, 30.0, 35.0, 20.0, 24.0, 17.0, 19.0, 12.0, 13.0, 10.0, 4.0, 8.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.892578125, -2.80419921875, -2.7158203125, -2.62744140625, -2.5390625, -2.45068359375, -2.3623046875, -2.27392578125, -2.185546875, -2.09716796875, -2.0087890625, -1.92041015625, -1.83203125, -1.74365234375, -1.6552734375, -1.56689453125, -1.478515625, -1.39013671875, -1.3017578125, -1.21337890625, -1.125, -1.03662109375, -0.9482421875, -0.85986328125, -0.771484375, -0.68310546875, -0.5947265625, -0.50634765625, -0.41796875, -0.32958984375, -0.2412109375, -0.15283203125, -0.064453125, 0.02392578125, 0.1123046875, 0.20068359375, 0.2890625, 0.37744140625, 0.4658203125, 0.55419921875, 0.642578125, 0.73095703125, 0.8193359375, 0.90771484375, 0.99609375, 1.08447265625, 1.1728515625, 1.26123046875, 1.349609375, 1.43798828125, 1.5263671875, 1.61474609375, 1.703125, 1.79150390625, 1.8798828125, 1.96826171875, 2.056640625, 2.14501953125, 2.2333984375, 2.32177734375, 2.41015625, 2.49853515625, 2.5869140625, 2.67529296875, 2.763671875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 6.0, 15.0, 10.0, 16.0, 13.0, 24.0, 35.0, 57.0, 51.0, 110.0, 111.0, 175.0, 241.0, 354.0, 609.0, 1058.0, 1877.0, 3503.0, 7508.0, 19865.0, 79653.0, 778175.0, 2899368.0, 326942.0, 48385.0, 13945.0, 5637.0, 2744.0, 1466.0, 814.0, 463.0, 298.0, 225.0, 149.0, 104.0, 74.0, 45.0, 39.0, 23.0, 23.0, 14.0, 5.0, 8.0, 12.0, 5.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-13.7109375, -13.2996826171875, -12.888427734375, -12.4771728515625, -12.06591796875, -11.6546630859375, -11.243408203125, -10.8321533203125, -10.4208984375, -10.0096435546875, -9.598388671875, -9.1871337890625, -8.77587890625, -8.3646240234375, -7.953369140625, -7.5421142578125, -7.130859375, -6.7196044921875, -6.308349609375, -5.8970947265625, -5.48583984375, -5.0745849609375, -4.663330078125, -4.2520751953125, -3.8408203125, -3.4295654296875, -3.018310546875, -2.6070556640625, -2.19580078125, -1.7845458984375, -1.373291015625, -0.9620361328125, -0.55078125, -0.1395263671875, 0.271728515625, 0.6829833984375, 1.09423828125, 1.5054931640625, 1.916748046875, 2.3280029296875, 2.7392578125, 3.1505126953125, 3.561767578125, 3.9730224609375, 4.38427734375, 4.7955322265625, 5.206787109375, 5.6180419921875, 6.029296875, 6.4405517578125, 6.851806640625, 7.2630615234375, 7.67431640625, 8.0855712890625, 8.496826171875, 8.9080810546875, 9.3193359375, 9.7305908203125, 10.141845703125, 10.5531005859375, 10.96435546875, 11.3756103515625, 11.786865234375, 12.1981201171875, 12.609375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 13.0, 11.0, 12.0, 25.0, 45.0, 53.0, 66.0, 92.0, 155.0, 214.0, 324.0, 477.0, 574.0, 604.0, 455.0, 357.0, 205.0, 120.0, 96.0, 60.0, 39.0, 33.0, 22.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.46875, -15.9697265625, -15.470703125, -14.9716796875, -14.47265625, -13.9736328125, -13.474609375, -12.9755859375, -12.4765625, -11.9775390625, -11.478515625, -10.9794921875, -10.48046875, -9.9814453125, -9.482421875, -8.9833984375, -8.484375, -7.9853515625, -7.486328125, -6.9873046875, -6.48828125, -5.9892578125, -5.490234375, -4.9912109375, -4.4921875, -3.9931640625, -3.494140625, -2.9951171875, -2.49609375, -1.9970703125, -1.498046875, -0.9990234375, -0.5, -0.0009765625, 0.498046875, 0.9970703125, 1.49609375, 1.9951171875, 2.494140625, 2.9931640625, 3.4921875, 3.9912109375, 4.490234375, 4.9892578125, 5.48828125, 5.9873046875, 6.486328125, 6.9853515625, 7.484375, 7.9833984375, 8.482421875, 8.9814453125, 9.48046875, 9.9794921875, 10.478515625, 10.9775390625, 11.4765625, 11.9755859375, 12.474609375, 12.9736328125, 13.47265625, 13.9716796875, 14.470703125, 14.9697265625, 15.46875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 11.0, 10.0, 22.0, 25.0, 48.0, 62.0, 108.0, 212.0, 541.0, 2429.0, 1561779.0, 2624873.0, 2872.0, 600.0, 263.0, 153.0, 94.0, 58.0, 42.0, 26.0, 15.0, 15.0, 9.0, 8.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0, -70.6474609375, -68.294921875, -65.9423828125, -63.58984375, -61.2373046875, -58.884765625, -56.5322265625, -54.1796875, -51.8271484375, -49.474609375, -47.1220703125, -44.76953125, -42.4169921875, -40.064453125, -37.7119140625, -35.359375, -33.0068359375, -30.654296875, -28.3017578125, -25.94921875, -23.5966796875, -21.244140625, -18.8916015625, -16.5390625, -14.1865234375, -11.833984375, -9.4814453125, -7.12890625, -4.7763671875, -2.423828125, -0.0712890625, 2.28125, 4.6337890625, 6.986328125, 9.3388671875, 11.69140625, 14.0439453125, 16.396484375, 18.7490234375, 21.1015625, 23.4541015625, 25.806640625, 28.1591796875, 30.51171875, 32.8642578125, 35.216796875, 37.5693359375, 39.921875, 42.2744140625, 44.626953125, 46.9794921875, 49.33203125, 51.6845703125, 54.037109375, 56.3896484375, 58.7421875, 61.0947265625, 63.447265625, 65.7998046875, 68.15234375, 70.5048828125, 72.857421875, 75.2099609375, 77.5625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 14.0, 65.0, 237.0, 368.0, 251.0, 67.0, 9.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-164.59982299804688, -161.06324768066406, -157.5266876220703, -153.9901123046875, -150.45355224609375, -146.91697692871094, -143.38040161132812, -139.84384155273438, -136.30726623535156, -132.77069091796875, -129.234130859375, -125.69755554199219, -122.1609878540039, -118.62442016601562, -115.08785247802734, -111.55128479003906, -108.01472473144531, -104.47815704345703, -100.94158935546875, -97.40501403808594, -93.86844635009766, -90.33187866210938, -86.7953109741211, -83.25874328613281, -79.72216796875, -76.18560028076172, -72.64903259277344, -69.11245727539062, -65.57588958740234, -62.03932189941406, -58.50275421142578, -54.9661865234375, -51.42961502075195, -47.89304733276367, -44.356475830078125, -40.819908142089844, -37.28334045410156, -33.74677276611328, -30.210201263427734, -26.673633575439453, -23.13706398010254, -19.600494384765625, -16.063926696777344, -12.52735710144043, -8.990788459777832, -5.454219818115234, -1.9176502227783203, 1.618917465209961, 5.155487060546875, 8.692055702209473, 12.22862434387207, 15.765193939208984, 19.301761627197266, 22.83833122253418, 26.374900817871094, 29.911468505859375, 33.448036193847656, 36.98460388183594, 40.521175384521484, 44.057743072509766, 47.59431076049805, 51.130882263183594, 54.667449951171875, 58.204017639160156, 61.7405891418457]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 12.0, 16.0, 9.0, 12.0, 15.0, 19.0, 21.0, 23.0, 16.0, 31.0, 27.0, 27.0, 38.0, 27.0, 39.0, 25.0, 47.0, 46.0, 51.0, 43.0, 42.0, 39.0, 29.0, 40.0, 41.0, 29.0, 35.0, 23.0, 22.0, 22.0, 16.0, 22.0, 19.0, 14.0, 18.0, 5.0, 6.0, 8.0, 4.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.191436767578125, -43.72285461425781, -42.2542724609375, -40.78569030761719, -39.31710433959961, -37.8485221862793, -36.379940032958984, -34.91135787963867, -33.44277572631836, -31.974193572998047, -30.5056095123291, -29.03702735900879, -27.568445205688477, -26.09986114501953, -24.63127899169922, -23.162696838378906, -21.69411277770996, -20.22553062438965, -18.756946563720703, -17.28836441040039, -15.819782257080078, -14.35119915008545, -12.88261604309082, -11.414033889770508, -9.945450782775879, -8.47686767578125, -7.0082855224609375, -5.539702415466309, -4.071119785308838, -2.602537155151367, -1.1339540481567383, 0.3346281051635742, 1.8032112121582031, 3.271793842315674, 4.7403764724731445, 6.208959579467773, 7.677542209625244, 9.146124839782715, 10.614707946777344, 12.083290100097656, 13.551873207092285, 15.020456314086914, 16.489038467407227, 17.957622528076172, 19.426204681396484, 20.894786834716797, 22.36336898803711, 23.831951141357422, 25.300535202026367, 26.76911735534668, 28.237701416015625, 29.706283569335938, 31.17486572265625, 32.64344787597656, 34.112030029296875, 35.58061218261719, 37.049198150634766, 38.51778030395508, 39.98636245727539, 41.45494842529297, 42.92353057861328, 44.392112731933594, 45.860694885253906, 47.32927703857422, 48.79785919189453]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 7.0, 8.0, 9.0, 13.0, 9.0, 10.0, 8.0, 12.0, 20.0, 18.0, 25.0, 17.0, 28.0, 32.0, 26.0, 32.0, 28.0, 35.0, 47.0, 44.0, 38.0, 45.0, 42.0, 36.0, 41.0, 38.0, 37.0, 34.0, 27.0, 45.0, 34.0, 23.0, 21.0, 16.0, 14.0, 20.0, 13.0, 7.0, 12.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.24609375, -3.1541748046875, -3.062255859375, -2.9703369140625, -2.87841796875, -2.7864990234375, -2.694580078125, -2.6026611328125, -2.5107421875, -2.4188232421875, -2.326904296875, -2.2349853515625, -2.14306640625, -2.0511474609375, -1.959228515625, -1.8673095703125, -1.775390625, -1.6834716796875, -1.591552734375, -1.4996337890625, -1.40771484375, -1.3157958984375, -1.223876953125, -1.1319580078125, -1.0400390625, -0.9481201171875, -0.856201171875, -0.7642822265625, -0.67236328125, -0.5804443359375, -0.488525390625, -0.3966064453125, -0.3046875, -0.2127685546875, -0.120849609375, -0.0289306640625, 0.06298828125, 0.1549072265625, 0.246826171875, 0.3387451171875, 0.4306640625, 0.5225830078125, 0.614501953125, 0.7064208984375, 0.79833984375, 0.8902587890625, 0.982177734375, 1.0740966796875, 1.166015625, 1.2579345703125, 1.349853515625, 1.4417724609375, 1.53369140625, 1.6256103515625, 1.717529296875, 1.8094482421875, 1.9013671875, 1.9932861328125, 2.085205078125, 2.1771240234375, 2.26904296875, 2.3609619140625, 2.452880859375, 2.5447998046875, 2.63671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 26.0, 12.0, 22.0, 40.0, 64.0, 78.0, 112.0, 171.0, 253.0, 286.0, 451.0, 640.0, 872.0, 1294.0, 1803.0, 2484.0, 3595.0, 5346.0, 7594.0, 10895.0, 16436.0, 25164.0, 39452.0, 63357.0, 101761.0, 154299.0, 190031.0, 150290.0, 97954.0, 61078.0, 38199.0, 24456.0, 15732.0, 10227.0, 7310.0, 4843.0, 3519.0, 2424.0, 1798.0, 1163.0, 846.0, 677.0, 452.0, 325.0, 214.0, 150.0, 88.0, 89.0, 55.0, 43.0, 25.0, 25.0, 7.0, 8.0, 6.0, 10.0, 3.0, 3.0], "bins": [-0.296142578125, -0.287017822265625, -0.27789306640625, -0.268768310546875, -0.2596435546875, -0.250518798828125, -0.24139404296875, -0.232269287109375, -0.22314453125, -0.214019775390625, -0.20489501953125, -0.195770263671875, -0.1866455078125, -0.177520751953125, -0.16839599609375, -0.159271240234375, -0.150146484375, -0.141021728515625, -0.13189697265625, -0.122772216796875, -0.1136474609375, -0.104522705078125, -0.09539794921875, -0.086273193359375, -0.0771484375, -0.068023681640625, -0.05889892578125, -0.049774169921875, -0.0406494140625, -0.031524658203125, -0.02239990234375, -0.013275146484375, -0.004150390625, 0.004974365234375, 0.01409912109375, 0.023223876953125, 0.0323486328125, 0.041473388671875, 0.05059814453125, 0.059722900390625, 0.06884765625, 0.077972412109375, 0.08709716796875, 0.096221923828125, 0.1053466796875, 0.114471435546875, 0.12359619140625, 0.132720947265625, 0.141845703125, 0.150970458984375, 0.16009521484375, 0.169219970703125, 0.1783447265625, 0.187469482421875, 0.19659423828125, 0.205718994140625, 0.21484375, 0.223968505859375, 0.23309326171875, 0.242218017578125, 0.2513427734375, 0.260467529296875, 0.26959228515625, 0.278717041015625, 0.287841796875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 3.0, 11.0, 7.0, 8.0, 9.0, 15.0, 21.0, 15.0, 24.0, 26.0, 22.0, 32.0, 28.0, 24.0, 40.0, 38.0, 51.0, 43.0, 43.0, 1071.0, 49.0, 43.0, 43.0, 36.0, 47.0, 40.0, 32.0, 30.0, 28.0, 27.0, 17.0, 24.0, 11.0, 13.0, 10.0, 7.0, 8.0, 9.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.15228271484375, -2.0877685546875, -2.02325439453125, -1.958740234375, -1.89422607421875, -1.8297119140625, -1.76519775390625, -1.70068359375, -1.63616943359375, -1.5716552734375, -1.50714111328125, -1.442626953125, -1.37811279296875, -1.3135986328125, -1.24908447265625, -1.1845703125, -1.12005615234375, -1.0555419921875, -0.99102783203125, -0.926513671875, -0.86199951171875, -0.7974853515625, -0.73297119140625, -0.66845703125, -0.60394287109375, -0.5394287109375, -0.47491455078125, -0.410400390625, -0.34588623046875, -0.2813720703125, -0.21685791015625, -0.15234375, -0.08782958984375, -0.0233154296875, 0.04119873046875, 0.105712890625, 0.17022705078125, 0.2347412109375, 0.29925537109375, 0.36376953125, 0.42828369140625, 0.4927978515625, 0.55731201171875, 0.621826171875, 0.68634033203125, 0.7508544921875, 0.81536865234375, 0.8798828125, 0.94439697265625, 1.0089111328125, 1.07342529296875, 1.137939453125, 1.20245361328125, 1.2669677734375, 1.33148193359375, 1.39599609375, 1.46051025390625, 1.5250244140625, 1.58953857421875, 1.654052734375, 1.71856689453125, 1.7830810546875, 1.84759521484375, 1.912109375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 0.0, 6.0, 5.0, 7.0, 8.0, 11.0, 19.0, 34.0, 51.0, 79.0, 115.0, 192.0, 264.0, 424.0, 704.0, 1060.0, 1681.0, 2778.0, 4632.0, 7439.0, 12176.0, 20805.0, 34792.0, 59033.0, 97904.0, 148988.0, 1234082.0, 168918.0, 119160.0, 73449.0, 43673.0, 25545.0, 15276.0, 9227.0, 5485.0, 3399.0, 2082.0, 1329.0, 824.0, 542.0, 309.0, 225.0, 143.0, 92.0, 58.0, 40.0, 21.0, 18.0, 16.0, 4.0, 8.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2464599609375, -0.2384357452392578, -0.23041152954101562, -0.22238731384277344, -0.21436309814453125, -0.20633888244628906, -0.19831466674804688, -0.1902904510498047, -0.1822662353515625, -0.1742420196533203, -0.16621780395507812, -0.15819358825683594, -0.15016937255859375, -0.14214515686035156, -0.13412094116210938, -0.1260967254638672, -0.118072509765625, -0.11004829406738281, -0.10202407836914062, -0.09399986267089844, -0.08597564697265625, -0.07795143127441406, -0.06992721557617188, -0.06190299987792969, -0.0538787841796875, -0.04585456848144531, -0.037830352783203125, -0.029806137084960938, -0.02178192138671875, -0.013757705688476562, -0.005733489990234375, 0.0022907257080078125, 0.01031494140625, 0.018339157104492188, 0.026363372802734375, 0.03438758850097656, 0.04241180419921875, 0.05043601989746094, 0.058460235595703125, 0.06648445129394531, 0.0745086669921875, 0.08253288269042969, 0.09055709838867188, 0.09858131408691406, 0.10660552978515625, 0.11462974548339844, 0.12265396118164062, 0.1306781768798828, 0.138702392578125, 0.1467266082763672, 0.15475082397460938, 0.16277503967285156, 0.17079925537109375, 0.17882347106933594, 0.18684768676757812, 0.1948719024658203, 0.2028961181640625, 0.2109203338623047, 0.21894454956054688, 0.22696876525878906, 0.23499298095703125, 0.24301719665527344, 0.2510414123535156, 0.2590656280517578, 0.26708984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 9.0, 11.0, 15.0, 17.0, 14.0, 31.0, 32.0, 41.0, 34.0, 58.0, 60.0, 81.0, 67.0, 60.0, 62.0, 69.0, 58.0, 62.0, 40.0, 41.0, 31.0, 19.0, 17.0, 19.0, 16.0, 7.0, 11.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010042190551757812, -0.0009712129831314087, -0.0009382069110870361, -0.0009052008390426636, -0.000872194766998291, -0.0008391886949539185, -0.0008061826229095459, -0.0007731765508651733, -0.0007401704788208008, -0.0007071644067764282, -0.0006741583347320557, -0.0006411522626876831, -0.0006081461906433105, -0.000575140118598938, -0.0005421340465545654, -0.0005091279745101929, -0.0004761219024658203, -0.00044311583042144775, -0.0004101097583770752, -0.00037710368633270264, -0.0003440976142883301, -0.0003110915422439575, -0.00027808547019958496, -0.0002450793981552124, -0.00021207332611083984, -0.00017906725406646729, -0.00014606118202209473, -0.00011305510997772217, -8.004903793334961e-05, -4.704296588897705e-05, -1.4036893844604492e-05, 1.8969178199768066e-05, 5.1975250244140625e-05, 8.498132228851318e-05, 0.00011798739433288574, 0.0001509934663772583, 0.00018399953842163086, 0.00021700561046600342, 0.000250011682510376, 0.00028301775455474854, 0.0003160238265991211, 0.00034902989864349365, 0.0003820359706878662, 0.00041504204273223877, 0.00044804811477661133, 0.0004810541868209839, 0.0005140602588653564, 0.000547066330909729, 0.0005800724029541016, 0.0006130784749984741, 0.0006460845470428467, 0.0006790906190872192, 0.0007120966911315918, 0.0007451027631759644, 0.0007781088352203369, 0.0008111149072647095, 0.000844120979309082, 0.0008771270513534546, 0.0009101331233978271, 0.0009431391954421997, 0.0009761452674865723, 0.0010091513395309448, 0.0010421574115753174, 0.00107516348361969, 0.0011081695556640625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 0.0, 9.0, 6.0, 6.0, 10.0, 7.0, 23.0, 21.0, 39.0, 54.0, 65.0, 95.0, 102.0, 173.0, 235.0, 373.0, 1080.0, 731996.0, 312217.0, 877.0, 355.0, 190.0, 172.0, 115.0, 89.0, 81.0, 42.0, 32.0, 25.0, 18.0, 15.0, 9.0, 8.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.023345947265625, -0.022696495056152344, -0.022047042846679688, -0.02139759063720703, -0.020748138427734375, -0.02009868621826172, -0.019449234008789062, -0.018799781799316406, -0.01815032958984375, -0.017500877380371094, -0.016851425170898438, -0.01620197296142578, -0.015552520751953125, -0.014903068542480469, -0.014253616333007812, -0.013604164123535156, -0.0129547119140625, -0.012305259704589844, -0.011655807495117188, -0.011006355285644531, -0.010356903076171875, -0.009707450866699219, -0.009057998657226562, -0.008408546447753906, -0.00775909423828125, -0.007109642028808594, -0.0064601898193359375, -0.005810737609863281, -0.005161285400390625, -0.004511833190917969, -0.0038623809814453125, -0.0032129287719726562, -0.0025634765625, -0.0019140243530273438, -0.0012645721435546875, -0.0006151199340820312, 3.4332275390625e-05, 0.0006837844848632812, 0.0013332366943359375, 0.0019826889038085938, 0.00263214111328125, 0.0032815933227539062, 0.0039310455322265625, 0.004580497741699219, 0.005229949951171875, 0.005879402160644531, 0.0065288543701171875, 0.007178306579589844, 0.0078277587890625, 0.008477210998535156, 0.009126663208007812, 0.009776115417480469, 0.010425567626953125, 0.011075019836425781, 0.011724472045898438, 0.012373924255371094, 0.01302337646484375, 0.013672828674316406, 0.014322280883789062, 0.014971733093261719, 0.015621185302734375, 0.01627063751220703, 0.016920089721679688, 0.017569541931152344, 0.018218994140625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 811.0, 207.0, 0.0, 0.0, 1.0], "bins": [-0.017217513173818588, -0.016929911449551582, -0.016642309725284576, -0.01635470800101757, -0.016067106276750565, -0.01577950455248356, -0.015491901896893978, -0.015204300172626972, -0.014916698448359966, -0.01462909672409296, -0.014341494999825954, -0.014053892344236374, -0.013766290619969368, -0.013478688895702362, -0.013191087171435356, -0.01290348544716835, -0.012615883722901344, -0.012328281998634338, -0.012040680274367332, -0.011753078550100327, -0.011465475894510746, -0.01117787417024374, -0.010890272445976734, -0.010602670721709728, -0.010315068066120148, -0.010027466341853142, -0.009739864617586136, -0.00945226289331913, -0.00916466023772955, -0.008877058513462543, -0.008589456789195538, -0.008301855064928532, -0.008014253340661526, -0.00772665161639452, -0.007439049426466227, -0.007151447702199221, -0.006863845977932215, -0.0065762437880039215, -0.006288642063736916, -0.00600104033946991, -0.005713438615202904, -0.005425836890935898, -0.005138234701007605, -0.004850632976740599, -0.004563031252473593, -0.0042754290625452995, -0.003987827338278294, -0.0037002256140112877, -0.0034126238897442818, -0.003125021932646632, -0.0028374202083796263, -0.0025498182512819767, -0.0022622165270149708, -0.001974614569917321, -0.0016870126128196716, -0.0013994108885526657, -0.0011118088150396943, -0.0008242069743573666, -0.0005366050754673779, -0.00024900317657738924, 3.859866410493851e-05, 0.00032620050478726625, 0.0006138024618849158, 0.0009014041861519217, 0.0011890061432495713]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 8.0, 10.0, 11.0, 19.0, 28.0, 20.0, 22.0, 27.0, 31.0, 34.0, 44.0, 40.0, 28.0, 33.0, 67.0, 42.0, 50.0, 41.0, 54.0, 50.0, 40.0, 47.0, 29.0, 42.0, 31.0, 28.0, 28.0, 19.0, 15.0, 16.0, 10.0, 9.0, 2.0, 8.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00046622753143310547, -0.0004495270550251007, -0.00043282657861709595, -0.0004161261022090912, -0.0003994256258010864, -0.00038272514939308167, -0.0003660246729850769, -0.00034932419657707214, -0.0003326237201690674, -0.0003159232437610626, -0.00029922276735305786, -0.0002825222909450531, -0.00026582181453704834, -0.0002491213381290436, -0.00023242086172103882, -0.00021572038531303406, -0.0001990199089050293, -0.00018231943249702454, -0.00016561895608901978, -0.00014891847968101501, -0.00013221800327301025, -0.00011551752686500549, -9.881705045700073e-05, -8.211657404899597e-05, -6.541609764099121e-05, -4.871562123298645e-05, -3.201514482498169e-05, -1.531466841697693e-05, 1.385807991027832e-06, 1.8086284399032593e-05, 3.4786760807037354e-05, 5.1487237215042114e-05, 6.818771362304688e-05, 8.488819003105164e-05, 0.0001015886664390564, 0.00011828914284706116, 0.00013498961925506592, 0.00015169009566307068, 0.00016839057207107544, 0.0001850910484790802, 0.00020179152488708496, 0.00021849200129508972, 0.00023519247770309448, 0.00025189295411109924, 0.000268593430519104, 0.00028529390692710876, 0.0003019943833351135, 0.0003186948597431183, 0.00033539533615112305, 0.0003520958125591278, 0.00036879628896713257, 0.00038549676537513733, 0.0004021972417831421, 0.00041889771819114685, 0.0004355981945991516, 0.00045229867100715637, 0.00046899914741516113, 0.0004856996238231659, 0.0005024001002311707, 0.0005191005766391754, 0.0005358010530471802, 0.0005525015294551849, 0.0005692020058631897, 0.0005859024822711945, 0.0006026029586791992]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 7.0, 8.0, 9.0, 13.0, 9.0, 10.0, 8.0, 12.0, 20.0, 18.0, 25.0, 17.0, 28.0, 32.0, 26.0, 32.0, 28.0, 35.0, 47.0, 44.0, 38.0, 45.0, 42.0, 36.0, 41.0, 38.0, 37.0, 34.0, 27.0, 45.0, 34.0, 23.0, 21.0, 16.0, 14.0, 20.0, 13.0, 7.0, 12.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.24609375, -3.1541748046875, -3.062255859375, -2.9703369140625, -2.87841796875, -2.7864990234375, -2.694580078125, -2.6026611328125, -2.5107421875, -2.4188232421875, -2.326904296875, -2.2349853515625, -2.14306640625, -2.0511474609375, -1.959228515625, -1.8673095703125, -1.775390625, -1.6834716796875, -1.591552734375, -1.4996337890625, -1.40771484375, -1.3157958984375, -1.223876953125, -1.1319580078125, -1.0400390625, -0.9481201171875, -0.856201171875, -0.7642822265625, -0.67236328125, -0.5804443359375, -0.488525390625, -0.3966064453125, -0.3046875, -0.2127685546875, -0.120849609375, -0.0289306640625, 0.06298828125, 0.1549072265625, 0.246826171875, 0.3387451171875, 0.4306640625, 0.5225830078125, 0.614501953125, 0.7064208984375, 0.79833984375, 0.8902587890625, 0.982177734375, 1.0740966796875, 1.166015625, 1.2579345703125, 1.349853515625, 1.4417724609375, 1.53369140625, 1.6256103515625, 1.717529296875, 1.8094482421875, 1.9013671875, 1.9932861328125, 2.085205078125, 2.1771240234375, 2.26904296875, 2.3609619140625, 2.452880859375, 2.5447998046875, 2.63671875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 5.0, 10.0, 17.0, 22.0, 19.0, 38.0, 38.0, 44.0, 86.0, 114.0, 142.0, 204.0, 281.0, 433.0, 687.0, 1339.0, 2701.0, 6341.0, 17451.0, 52963.0, 173754.0, 423534.0, 249896.0, 77005.0, 24980.0, 8699.0, 3513.0, 1683.0, 885.0, 482.0, 338.0, 260.0, 168.0, 117.0, 70.0, 69.0, 47.0, 32.0, 26.0, 14.0, 13.0, 8.0, 4.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.265625, -3.168609619140625, -3.07159423828125, -2.974578857421875, -2.8775634765625, -2.780548095703125, -2.68353271484375, -2.586517333984375, -2.489501953125, -2.392486572265625, -2.29547119140625, -2.198455810546875, -2.1014404296875, -2.004425048828125, -1.90740966796875, -1.810394287109375, -1.71337890625, -1.616363525390625, -1.51934814453125, -1.422332763671875, -1.3253173828125, -1.228302001953125, -1.13128662109375, -1.034271240234375, -0.937255859375, -0.840240478515625, -0.74322509765625, -0.646209716796875, -0.5491943359375, -0.452178955078125, -0.35516357421875, -0.258148193359375, -0.1611328125, -0.064117431640625, 0.03289794921875, 0.129913330078125, 0.2269287109375, 0.323944091796875, 0.42095947265625, 0.517974853515625, 0.614990234375, 0.712005615234375, 0.80902099609375, 0.906036376953125, 1.0030517578125, 1.100067138671875, 1.19708251953125, 1.294097900390625, 1.39111328125, 1.488128662109375, 1.58514404296875, 1.682159423828125, 1.7791748046875, 1.876190185546875, 1.97320556640625, 2.070220947265625, 2.167236328125, 2.264251708984375, 2.36126708984375, 2.458282470703125, 2.5552978515625, 2.652313232421875, 2.74932861328125, 2.846343994140625, 2.943359375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 5.0, 5.0, 5.0, 9.0, 9.0, 10.0, 13.0, 13.0, 19.0, 22.0, 22.0, 34.0, 24.0, 20.0, 32.0, 38.0, 27.0, 38.0, 65.0, 66.0, 223.0, 1598.0, 241.0, 82.0, 50.0, 49.0, 37.0, 29.0, 44.0, 38.0, 29.0, 28.0, 22.0, 18.0, 12.0, 17.0, 10.0, 9.0, 10.0, 5.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-10.828125, -10.5054931640625, -10.182861328125, -9.8602294921875, -9.53759765625, -9.2149658203125, -8.892333984375, -8.5697021484375, -8.2470703125, -7.9244384765625, -7.601806640625, -7.2791748046875, -6.95654296875, -6.6339111328125, -6.311279296875, -5.9886474609375, -5.666015625, -5.3433837890625, -5.020751953125, -4.6981201171875, -4.37548828125, -4.0528564453125, -3.730224609375, -3.4075927734375, -3.0849609375, -2.7623291015625, -2.439697265625, -2.1170654296875, -1.79443359375, -1.4718017578125, -1.149169921875, -0.8265380859375, -0.50390625, -0.1812744140625, 0.141357421875, 0.4639892578125, 0.78662109375, 1.1092529296875, 1.431884765625, 1.7545166015625, 2.0771484375, 2.3997802734375, 2.722412109375, 3.0450439453125, 3.36767578125, 3.6903076171875, 4.012939453125, 4.3355712890625, 4.658203125, 4.9808349609375, 5.303466796875, 5.6260986328125, 5.94873046875, 6.2713623046875, 6.593994140625, 6.9166259765625, 7.2392578125, 7.5618896484375, 7.884521484375, 8.2071533203125, 8.52978515625, 8.8524169921875, 9.175048828125, 9.4976806640625, 9.8203125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 1.0, 2.0, 4.0, 6.0, 5.0, 10.0, 14.0, 13.0, 11.0, 17.0, 18.0, 39.0, 30.0, 38.0, 60.0, 69.0, 95.0, 160.0, 343.0, 964.0, 10441.0, 3094080.0, 36668.0, 1454.0, 469.0, 190.0, 116.0, 70.0, 60.0, 43.0, 33.0, 25.0, 28.0, 28.0, 22.0, 13.0, 7.0, 10.0, 11.0, 7.0, 4.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.515625, -21.7802734375, -21.044921875, -20.3095703125, -19.57421875, -18.8388671875, -18.103515625, -17.3681640625, -16.6328125, -15.8974609375, -15.162109375, -14.4267578125, -13.69140625, -12.9560546875, -12.220703125, -11.4853515625, -10.75, -10.0146484375, -9.279296875, -8.5439453125, -7.80859375, -7.0732421875, -6.337890625, -5.6025390625, -4.8671875, -4.1318359375, -3.396484375, -2.6611328125, -1.92578125, -1.1904296875, -0.455078125, 0.2802734375, 1.015625, 1.7509765625, 2.486328125, 3.2216796875, 3.95703125, 4.6923828125, 5.427734375, 6.1630859375, 6.8984375, 7.6337890625, 8.369140625, 9.1044921875, 9.83984375, 10.5751953125, 11.310546875, 12.0458984375, 12.78125, 13.5166015625, 14.251953125, 14.9873046875, 15.72265625, 16.4580078125, 17.193359375, 17.9287109375, 18.6640625, 19.3994140625, 20.134765625, 20.8701171875, 21.60546875, 22.3408203125, 23.076171875, 23.8115234375, 24.546875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [572.0, 445.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.790811061859131, 0.052968740463256836, 3.8967485427856445, 7.740528583526611, 11.584308624267578, 15.42808723449707, 19.271867752075195, 23.115646362304688, 26.959426879882812, 30.803207397460938, 34.64698791503906, 38.49076843261719, 42.33454513549805, 46.17832565307617, 50.0221061706543, 53.865882873535156, 57.70966720581055, 61.55344772338867, 65.39722442626953, 69.24100494384766, 73.08478546142578, 76.9285659790039, 80.77234649658203, 84.61612701416016, 88.45990753173828, 92.3036880493164, 96.14746856689453, 99.99124908447266, 103.83502960205078, 107.67880249023438, 111.5225830078125, 115.36636352539062, 119.21013641357422, 123.05391693115234, 126.89769744873047, 130.74147033691406, 134.5852508544922, 138.4290313720703, 142.27281188964844, 146.11659240722656, 149.9603729248047, 153.8041534423828, 157.64793395996094, 161.49171447753906, 165.3354949951172, 169.1792755126953, 173.02305603027344, 176.86683654785156, 180.7106170654297, 184.5543975830078, 188.39817810058594, 192.24195861816406, 196.0857391357422, 199.9295196533203, 203.77330017089844, 207.61708068847656, 211.46084594726562, 215.30462646484375, 219.14840698242188, 222.9921875, 226.83596801757812, 230.67974853515625, 234.52352905273438, 238.3673095703125, 242.21109008789062]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 8.0, 8.0, 7.0, 13.0, 19.0, 24.0, 16.0, 30.0, 23.0, 27.0, 27.0, 34.0, 46.0, 34.0, 32.0, 43.0, 50.0, 37.0, 58.0, 38.0, 46.0, 44.0, 41.0, 37.0, 37.0, 30.0, 25.0, 20.0, 19.0, 13.0, 12.0, 12.0, 16.0, 13.0, 6.0, 9.0, 7.0, 1.0, 4.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.27735137939453, -33.21554946899414, -32.153743743896484, -31.091941833496094, -30.030139923095703, -28.96833610534668, -27.906532287597656, -26.844730377197266, -25.782926559448242, -24.72112274169922, -23.659320831298828, -22.597517013549805, -21.53571319580078, -20.47391128540039, -19.412107467651367, -18.350303649902344, -17.288501739501953, -16.22669792175293, -15.164896011352539, -14.103092193603516, -13.041289329528809, -11.979486465454102, -10.917682647705078, -9.855879783630371, -8.794076919555664, -7.732274055480957, -6.670470714569092, -5.608667373657227, -4.5468645095825195, -3.4850616455078125, -2.4232583045959473, -1.361454963684082, -0.299652099609375, 0.7621510028839111, 1.8239541053771973, 2.8857572078704834, 3.9475603103637695, 5.009363174438477, 6.071166515350342, 7.132969856262207, 8.194772720336914, 9.256575584411621, 10.318378448486328, 11.380182266235352, 12.441985130310059, 13.503787994384766, 14.565591812133789, 15.627394676208496, 16.689197540283203, 17.751001358032227, 18.812803268432617, 19.87460708618164, 20.93640899658203, 21.998212814331055, 23.060016632080078, 24.12181854248047, 25.183622360229492, 26.245426177978516, 27.307228088378906, 28.36903190612793, 29.430835723876953, 30.492637634277344, 31.554441452026367, 32.61624526977539, 33.67804718017578]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 9.0, 5.0, 7.0, 8.0, 13.0, 9.0, 9.0, 12.0, 17.0, 18.0, 19.0, 16.0, 25.0, 22.0, 32.0, 27.0, 22.0, 35.0, 36.0, 40.0, 40.0, 30.0, 48.0, 36.0, 45.0, 34.0, 34.0, 30.0, 46.0, 31.0, 25.0, 38.0, 30.0, 23.0, 19.0, 17.0, 10.0, 19.0, 6.0, 10.0, 17.0, 6.0, 4.0, 8.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 3.0], "bins": [-3.048828125, -2.96026611328125, -2.8717041015625, -2.78314208984375, -2.694580078125, -2.60601806640625, -2.5174560546875, -2.42889404296875, -2.34033203125, -2.25177001953125, -2.1632080078125, -2.07464599609375, -1.986083984375, -1.89752197265625, -1.8089599609375, -1.72039794921875, -1.6318359375, -1.54327392578125, -1.4547119140625, -1.36614990234375, -1.277587890625, -1.18902587890625, -1.1004638671875, -1.01190185546875, -0.92333984375, -0.83477783203125, -0.7462158203125, -0.65765380859375, -0.569091796875, -0.48052978515625, -0.3919677734375, -0.30340576171875, -0.21484375, -0.12628173828125, -0.0377197265625, 0.05084228515625, 0.139404296875, 0.22796630859375, 0.3165283203125, 0.40509033203125, 0.49365234375, 0.58221435546875, 0.6707763671875, 0.75933837890625, 0.847900390625, 0.93646240234375, 1.0250244140625, 1.11358642578125, 1.2021484375, 1.29071044921875, 1.3792724609375, 1.46783447265625, 1.556396484375, 1.64495849609375, 1.7335205078125, 1.82208251953125, 1.91064453125, 1.99920654296875, 2.0877685546875, 2.17633056640625, 2.264892578125, 2.35345458984375, 2.4420166015625, 2.53057861328125, 2.619140625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 7.0, 6.0, 7.0, 13.0, 10.0, 18.0, 12.0, 20.0, 25.0, 19.0, 44.0, 53.0, 42.0, 63.0, 90.0, 159.0, 295.0, 731.0, 2591.0, 15352.0, 141118.0, 2084101.0, 1811594.0, 120235.0, 13506.0, 2552.0, 743.0, 305.0, 142.0, 121.0, 63.0, 36.0, 38.0, 41.0, 21.0, 22.0, 22.0, 17.0, 7.0, 8.0, 6.0, 6.0, 8.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.3673095703125, -11.000244140625, -10.6331787109375, -10.26611328125, -9.8990478515625, -9.531982421875, -9.1649169921875, -8.7978515625, -8.4307861328125, -8.063720703125, -7.6966552734375, -7.32958984375, -6.9625244140625, -6.595458984375, -6.2283935546875, -5.861328125, -5.4942626953125, -5.127197265625, -4.7601318359375, -4.39306640625, -4.0260009765625, -3.658935546875, -3.2918701171875, -2.9248046875, -2.5577392578125, -2.190673828125, -1.8236083984375, -1.45654296875, -1.0894775390625, -0.722412109375, -0.3553466796875, 0.01171875, 0.3787841796875, 0.745849609375, 1.1129150390625, 1.47998046875, 1.8470458984375, 2.214111328125, 2.5811767578125, 2.9482421875, 3.3153076171875, 3.682373046875, 4.0494384765625, 4.41650390625, 4.7835693359375, 5.150634765625, 5.5177001953125, 5.884765625, 6.2518310546875, 6.618896484375, 6.9859619140625, 7.35302734375, 7.7200927734375, 8.087158203125, 8.4542236328125, 8.8212890625, 9.1883544921875, 9.555419921875, 9.9224853515625, 10.28955078125, 10.6566162109375, 11.023681640625, 11.3907470703125, 11.7578125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 18.0, 28.0, 36.0, 46.0, 64.0, 121.0, 139.0, 222.0, 293.0, 400.0, 489.0, 509.0, 458.0, 362.0, 257.0, 184.0, 137.0, 85.0, 59.0, 44.0, 37.0, 17.0, 18.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5625, -12.1605224609375, -11.758544921875, -11.3565673828125, -10.95458984375, -10.5526123046875, -10.150634765625, -9.7486572265625, -9.3466796875, -8.9447021484375, -8.542724609375, -8.1407470703125, -7.73876953125, -7.3367919921875, -6.934814453125, -6.5328369140625, -6.130859375, -5.7288818359375, -5.326904296875, -4.9249267578125, -4.52294921875, -4.1209716796875, -3.718994140625, -3.3170166015625, -2.9150390625, -2.5130615234375, -2.111083984375, -1.7091064453125, -1.30712890625, -0.9051513671875, -0.503173828125, -0.1011962890625, 0.30078125, 0.7027587890625, 1.104736328125, 1.5067138671875, 1.90869140625, 2.3106689453125, 2.712646484375, 3.1146240234375, 3.5166015625, 3.9185791015625, 4.320556640625, 4.7225341796875, 5.12451171875, 5.5264892578125, 5.928466796875, 6.3304443359375, 6.732421875, 7.1343994140625, 7.536376953125, 7.9383544921875, 8.34033203125, 8.7423095703125, 9.144287109375, 9.5462646484375, 9.9482421875, 10.3502197265625, 10.752197265625, 11.1541748046875, 11.55615234375, 11.9581298828125, 12.360107421875, 12.7620849609375, 13.1640625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 11.0, 7.0, 16.0, 17.0, 31.0, 55.0, 58.0, 93.0, 142.0, 268.0, 591.0, 2039.0, 24765.0, 2410212.0, 1733886.0, 19134.0, 1708.0, 523.0, 265.0, 142.0, 90.0, 58.0, 53.0, 40.0, 14.0, 10.0, 13.0, 8.0, 6.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-34.46875, -33.318359375, -32.16796875, -31.017578125, -29.8671875, -28.716796875, -27.56640625, -26.416015625, -25.265625, -24.115234375, -22.96484375, -21.814453125, -20.6640625, -19.513671875, -18.36328125, -17.212890625, -16.0625, -14.912109375, -13.76171875, -12.611328125, -11.4609375, -10.310546875, -9.16015625, -8.009765625, -6.859375, -5.708984375, -4.55859375, -3.408203125, -2.2578125, -1.107421875, 0.04296875, 1.193359375, 2.34375, 3.494140625, 4.64453125, 5.794921875, 6.9453125, 8.095703125, 9.24609375, 10.396484375, 11.546875, 12.697265625, 13.84765625, 14.998046875, 16.1484375, 17.298828125, 18.44921875, 19.599609375, 20.75, 21.900390625, 23.05078125, 24.201171875, 25.3515625, 26.501953125, 27.65234375, 28.802734375, 29.953125, 31.103515625, 32.25390625, 33.404296875, 34.5546875, 35.705078125, 36.85546875, 38.005859375, 39.15625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 54.0, 206.0, 385.0, 259.0, 77.0, 19.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.69924926757812, -65.49522399902344, -61.291194915771484, -57.08716583251953, -52.883140563964844, -48.679115295410156, -44.4750862121582, -40.27105712890625, -36.06703186035156, -31.863004684448242, -27.658977508544922, -23.4549503326416, -19.25092315673828, -15.046895980834961, -10.84286880493164, -6.63884162902832, -2.434814453125, 1.7692127227783203, 5.973239898681641, 10.177267074584961, 14.381294250488281, 18.5853214263916, 22.789348602294922, 26.993375778198242, 31.197402954101562, 35.40142822265625, 39.6054573059082, 43.809486389160156, 48.013511657714844, 52.21753692626953, 56.421566009521484, 60.62559509277344, 64.82963562011719, 69.03366088867188, 73.23768615722656, 77.44171905517578, 81.64574432373047, 85.84976959228516, 90.05380249023438, 94.25782775878906, 98.46185302734375, 102.66587829589844, 106.86990356445312, 111.07393646240234, 115.27796173095703, 119.48198699951172, 123.68601989746094, 127.89004516601562, 132.0940704345703, 136.298095703125, 140.5021209716797, 144.70614624023438, 148.91018676757812, 153.1142120361328, 157.3182373046875, 161.5222625732422, 165.72628784179688, 169.93031311035156, 174.13433837890625, 178.33836364746094, 182.54238891601562, 186.74642944335938, 190.95045471191406, 195.15447998046875, 199.35850524902344]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 7.0, 5.0, 9.0, 9.0, 15.0, 12.0, 19.0, 22.0, 26.0, 22.0, 27.0, 27.0, 38.0, 38.0, 34.0, 42.0, 37.0, 42.0, 35.0, 49.0, 45.0, 52.0, 40.0, 26.0, 30.0, 28.0, 35.0, 32.0, 27.0, 25.0, 27.0, 24.0, 21.0, 16.0, 8.0, 10.0, 10.0, 12.0, 6.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.288360595703125, -33.15347671508789, -32.01859664916992, -30.88371467590332, -29.74883270263672, -28.613948822021484, -27.479066848754883, -26.34418487548828, -25.20930290222168, -24.074420928955078, -22.939538955688477, -21.804656982421875, -20.66977310180664, -19.534893035888672, -18.400009155273438, -17.265127182006836, -16.130245208740234, -14.995363235473633, -13.860481262207031, -12.725598335266113, -11.590716361999512, -10.45583438873291, -9.320951461791992, -8.18606948852539, -7.051187515258789, -5.9163055419921875, -4.781423091888428, -3.646540880203247, -2.5116586685180664, -1.3767766952514648, -0.24189424514770508, 0.8929882049560547, 2.0278701782226562, 3.162752389907837, 4.297634601593018, 5.432517051696777, 6.567399024963379, 7.7022809982299805, 8.837163925170898, 9.9720458984375, 11.106927871704102, 12.241809844970703, 13.376691818237305, 14.511574745178223, 15.646456718444824, 16.78133773803711, 17.916221618652344, 19.051103591918945, 20.185985565185547, 21.32086753845215, 22.45574951171875, 23.59063148498535, 24.725513458251953, 25.860397338867188, 26.99527931213379, 28.13016128540039, 29.265043258666992, 30.399925231933594, 31.534807205200195, 32.6696891784668, 33.80457305908203, 34.939453125, 36.074337005615234, 37.20922088623047, 38.34410095214844]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 8.0, 13.0, 8.0, 14.0, 20.0, 9.0, 18.0, 22.0, 27.0, 26.0, 26.0, 41.0, 29.0, 36.0, 42.0, 40.0, 39.0, 45.0, 52.0, 40.0, 53.0, 42.0, 40.0, 30.0, 27.0, 34.0, 25.0, 29.0, 27.0, 20.0, 28.0, 14.0, 15.0, 12.0, 6.0, 7.0, 6.0, 9.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.54296875, -3.439300537109375, -3.33563232421875, -3.231964111328125, -3.1282958984375, -3.024627685546875, -2.92095947265625, -2.817291259765625, -2.713623046875, -2.609954833984375, -2.50628662109375, -2.402618408203125, -2.2989501953125, -2.195281982421875, -2.09161376953125, -1.987945556640625, -1.88427734375, -1.780609130859375, -1.67694091796875, -1.573272705078125, -1.4696044921875, -1.365936279296875, -1.26226806640625, -1.158599853515625, -1.054931640625, -0.951263427734375, -0.84759521484375, -0.743927001953125, -0.6402587890625, -0.536590576171875, -0.43292236328125, -0.329254150390625, -0.2255859375, -0.121917724609375, -0.01824951171875, 0.085418701171875, 0.1890869140625, 0.292755126953125, 0.39642333984375, 0.500091552734375, 0.603759765625, 0.707427978515625, 0.81109619140625, 0.914764404296875, 1.0184326171875, 1.122100830078125, 1.22576904296875, 1.329437255859375, 1.43310546875, 1.536773681640625, 1.64044189453125, 1.744110107421875, 1.8477783203125, 1.951446533203125, 2.05511474609375, 2.158782958984375, 2.262451171875, 2.366119384765625, 2.46978759765625, 2.573455810546875, 2.6771240234375, 2.780792236328125, 2.88446044921875, 2.988128662109375, 3.091796875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 20.0, 17.0, 33.0, 41.0, 79.0, 113.0, 196.0, 240.0, 360.0, 563.0, 835.0, 1352.0, 2025.0, 2924.0, 4491.0, 6314.0, 9856.0, 14548.0, 22662.0, 35057.0, 56287.0, 89834.0, 140233.0, 187482.0, 165258.0, 112151.0, 69939.0, 44297.0, 27686.0, 18066.0, 11898.0, 7788.0, 5290.0, 3497.0, 2341.0, 1615.0, 1048.0, 703.0, 482.0, 296.0, 215.0, 135.0, 83.0, 65.0, 44.0, 40.0, 23.0, 11.0, 5.0, 5.0, 1.0, 2.0, 3.0, 4.0], "bins": [-0.3388671875, -0.3288230895996094, -0.31877899169921875, -0.3087348937988281, -0.2986907958984375, -0.2886466979980469, -0.27860260009765625, -0.2685585021972656, -0.258514404296875, -0.24847030639648438, -0.23842620849609375, -0.22838211059570312, -0.2183380126953125, -0.20829391479492188, -0.19824981689453125, -0.18820571899414062, -0.17816162109375, -0.16811752319335938, -0.15807342529296875, -0.14802932739257812, -0.1379852294921875, -0.12794113159179688, -0.11789703369140625, -0.10785293579101562, -0.097808837890625, -0.08776473999023438, -0.07772064208984375, -0.06767654418945312, -0.0576324462890625, -0.047588348388671875, -0.03754425048828125, -0.027500152587890625, -0.0174560546875, -0.007411956787109375, 0.00263214111328125, 0.012676239013671875, 0.0227203369140625, 0.032764434814453125, 0.04280853271484375, 0.052852630615234375, 0.062896728515625, 0.07294082641601562, 0.08298492431640625, 0.09302902221679688, 0.1030731201171875, 0.11311721801757812, 0.12316131591796875, 0.13320541381835938, 0.14324951171875, 0.15329360961914062, 0.16333770751953125, 0.17338180541992188, 0.1834259033203125, 0.19347000122070312, 0.20351409912109375, 0.21355819702148438, 0.223602294921875, 0.23364639282226562, 0.24369049072265625, 0.2537345886230469, 0.2637786865234375, 0.2738227844238281, 0.28386688232421875, 0.2939109802246094, 0.303955078125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 1.0, 3.0, 6.0, 0.0, 2.0, 10.0, 9.0, 10.0, 14.0, 13.0, 19.0, 13.0, 16.0, 20.0, 22.0, 30.0, 35.0, 33.0, 31.0, 32.0, 36.0, 33.0, 32.0, 36.0, 1072.0, 32.0, 49.0, 29.0, 27.0, 38.0, 32.0, 31.0, 37.0, 32.0, 34.0, 19.0, 20.0, 14.0, 16.0, 19.0, 12.0, 9.0, 14.0, 9.0, 5.0, 4.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.11328125, -2.05145263671875, -1.9896240234375, -1.92779541015625, -1.865966796875, -1.80413818359375, -1.7423095703125, -1.68048095703125, -1.61865234375, -1.55682373046875, -1.4949951171875, -1.43316650390625, -1.371337890625, -1.30950927734375, -1.2476806640625, -1.18585205078125, -1.1240234375, -1.06219482421875, -1.0003662109375, -0.93853759765625, -0.876708984375, -0.81488037109375, -0.7530517578125, -0.69122314453125, -0.62939453125, -0.56756591796875, -0.5057373046875, -0.44390869140625, -0.382080078125, -0.32025146484375, -0.2584228515625, -0.19659423828125, -0.134765625, -0.07293701171875, -0.0111083984375, 0.05072021484375, 0.112548828125, 0.17437744140625, 0.2362060546875, 0.29803466796875, 0.35986328125, 0.42169189453125, 0.4835205078125, 0.54534912109375, 0.607177734375, 0.66900634765625, 0.7308349609375, 0.79266357421875, 0.8544921875, 0.91632080078125, 0.9781494140625, 1.03997802734375, 1.101806640625, 1.16363525390625, 1.2254638671875, 1.28729248046875, 1.34912109375, 1.41094970703125, 1.4727783203125, 1.53460693359375, 1.596435546875, 1.65826416015625, 1.7200927734375, 1.78192138671875, 1.84375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 6.0, 17.0, 21.0, 32.0, 42.0, 67.0, 78.0, 157.0, 227.0, 278.0, 494.0, 779.0, 1167.0, 1898.0, 2909.0, 4608.0, 7244.0, 11929.0, 18915.0, 30836.0, 50917.0, 85678.0, 133883.0, 1148261.0, 255115.0, 130140.0, 82422.0, 49731.0, 29689.0, 18571.0, 11286.0, 7171.0, 4518.0, 2885.0, 1858.0, 1176.0, 720.0, 501.0, 299.0, 223.0, 115.0, 94.0, 67.0, 31.0, 28.0, 19.0, 5.0, 8.0, 10.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.266845703125, -0.25875091552734375, -0.2506561279296875, -0.24256134033203125, -0.234466552734375, -0.22637176513671875, -0.2182769775390625, -0.21018218994140625, -0.20208740234375, -0.19399261474609375, -0.1858978271484375, -0.17780303955078125, -0.169708251953125, -0.16161346435546875, -0.1535186767578125, -0.14542388916015625, -0.1373291015625, -0.12923431396484375, -0.1211395263671875, -0.11304473876953125, -0.104949951171875, -0.09685516357421875, -0.0887603759765625, -0.08066558837890625, -0.07257080078125, -0.06447601318359375, -0.0563812255859375, -0.04828643798828125, -0.040191650390625, -0.03209686279296875, -0.0240020751953125, -0.01590728759765625, -0.0078125, 0.00028228759765625, 0.0083770751953125, 0.01647186279296875, 0.024566650390625, 0.03266143798828125, 0.0407562255859375, 0.04885101318359375, 0.05694580078125, 0.06504058837890625, 0.0731353759765625, 0.08123016357421875, 0.089324951171875, 0.09741973876953125, 0.1055145263671875, 0.11360931396484375, 0.1217041015625, 0.12979888916015625, 0.1378936767578125, 0.14598846435546875, 0.154083251953125, 0.16217803955078125, 0.1702728271484375, 0.17836761474609375, 0.18646240234375, 0.19455718994140625, 0.2026519775390625, 0.21074676513671875, 0.218841552734375, 0.22693634033203125, 0.2350311279296875, 0.24312591552734375, 0.251220703125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 12.0, 15.0, 7.0, 17.0, 26.0, 17.0, 28.0, 26.0, 24.0, 41.0, 47.0, 40.0, 44.0, 44.0, 49.0, 39.0, 51.0, 46.0, 50.0, 45.0, 45.0, 38.0, 42.0, 33.0, 27.0, 23.0, 20.0, 19.0, 16.0, 12.0, 9.0, 4.0, 8.0, 1.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0008268356323242188, -0.0008020699024200439, -0.0007773041725158691, -0.0007525384426116943, -0.0007277727127075195, -0.0007030069828033447, -0.0006782412528991699, -0.0006534755229949951, -0.0006287097930908203, -0.0006039440631866455, -0.0005791783332824707, -0.0005544126033782959, -0.0005296468734741211, -0.0005048811435699463, -0.0004801154136657715, -0.0004553496837615967, -0.0004305839538574219, -0.00040581822395324707, -0.00038105249404907227, -0.00035628676414489746, -0.00033152103424072266, -0.00030675530433654785, -0.00028198957443237305, -0.00025722384452819824, -0.00023245811462402344, -0.00020769238471984863, -0.00018292665481567383, -0.00015816092491149902, -0.00013339519500732422, -0.00010862946510314941, -8.386373519897461e-05, -5.9098005294799805e-05, -3.4332275390625e-05, -9.566545486450195e-06, 1.519918441772461e-05, 3.9964914321899414e-05, 6.473064422607422e-05, 8.949637413024902e-05, 0.00011426210403442383, 0.00013902783393859863, 0.00016379356384277344, 0.00018855929374694824, 0.00021332502365112305, 0.00023809075355529785, 0.00026285648345947266, 0.00028762221336364746, 0.00031238794326782227, 0.00033715367317199707, 0.0003619194030761719, 0.0003866851329803467, 0.0004114508628845215, 0.0004362165927886963, 0.0004609823226928711, 0.0004857480525970459, 0.0005105137825012207, 0.0005352795124053955, 0.0005600452423095703, 0.0005848109722137451, 0.0006095767021179199, 0.0006343424320220947, 0.0006591081619262695, 0.0006838738918304443, 0.0007086396217346191, 0.0007334053516387939, 0.0007581710815429688]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 8.0, 8.0, 10.0, 15.0, 14.0, 16.0, 34.0, 32.0, 52.0, 56.0, 65.0, 87.0, 114.0, 144.0, 227.0, 323.0, 804.0, 37304.0, 1001516.0, 6052.0, 555.0, 294.0, 199.0, 127.0, 94.0, 82.0, 86.0, 57.0, 26.0, 33.0, 18.0, 30.0, 15.0, 19.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0169219970703125, -0.016398906707763672, -0.015875816345214844, -0.015352725982666016, -0.014829635620117188, -0.01430654525756836, -0.013783454895019531, -0.013260364532470703, -0.012737274169921875, -0.012214183807373047, -0.011691093444824219, -0.01116800308227539, -0.010644912719726562, -0.010121822357177734, -0.009598731994628906, -0.009075641632080078, -0.00855255126953125, -0.008029460906982422, -0.007506370544433594, -0.006983280181884766, -0.0064601898193359375, -0.005937099456787109, -0.005414009094238281, -0.004890918731689453, -0.004367828369140625, -0.003844738006591797, -0.0033216476440429688, -0.0027985572814941406, -0.0022754669189453125, -0.0017523765563964844, -0.0012292861938476562, -0.0007061958312988281, -0.00018310546875, 0.0003399848937988281, 0.0008630752563476562, 0.0013861656188964844, 0.0019092559814453125, 0.0024323463439941406, 0.0029554367065429688, 0.003478527069091797, 0.004001617431640625, 0.004524707794189453, 0.005047798156738281, 0.005570888519287109, 0.0060939788818359375, 0.006617069244384766, 0.007140159606933594, 0.007663249969482422, 0.00818634033203125, 0.008709430694580078, 0.009232521057128906, 0.009755611419677734, 0.010278701782226562, 0.01080179214477539, 0.011324882507324219, 0.011847972869873047, 0.012371063232421875, 0.012894153594970703, 0.013417243957519531, 0.01394033432006836, 0.014463424682617188, 0.014986515045166016, 0.015509605407714844, 0.016032695770263672, 0.0165557861328125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 11.0, 44.0, 90.0, 185.0, 277.0, 208.0, 122.0, 48.0, 18.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.002124866470694542, -0.002086655469611287, -0.0020484444685280323, -0.0020102334674447775, -0.0019720224663615227, -0.0019338115816935897, -0.0018956005806103349, -0.0018573896959424019, -0.001819178694859147, -0.0017809676937758923, -0.0017427566926926374, -0.0017045458080247045, -0.0016663348069414496, -0.0016281238058581948, -0.00158991280477494, -0.001551701920107007, -0.0015134909190237522, -0.0014752799179404974, -0.0014370689168572426, -0.0013988580321893096, -0.0013606470311060548, -0.0013224360300228, -0.0012842250289395452, -0.0012460141442716122, -0.0012078030267730355, -0.0011695920256897807, -0.001131381024606526, -0.001093170139938593, -0.001054959138855338, -0.0010167481377720833, -0.0009785371366888285, -0.0009403261938132346, -0.0009021152509376407, -0.0008639042498543859, -0.000825693306978792, -0.0007874823058955371, -0.0007492713630199432, -0.0007110603619366884, -0.0006728493608534336, -0.0006346384179778397, -0.0005964274751022458, -0.000558216474018991, -0.0005200055311433971, -0.0004817945300601423, -0.0004435835871845484, -0.00040537258610129356, -0.0003671616141218692, -0.00032895064214244485, -0.0002907396701630205, -0.00025252869818359613, -0.00021431772620417178, -0.0001761067396728322, -0.00013789576769340783, -9.968479571398348e-05, -6.147380918264389e-05, -2.3262837203219533e-05, 1.4948134776204824e-05, 5.315911039360799e-05, 9.137008601101115e-05, 0.00012958106526639313, 0.00016779203724581748, 0.00020600300922524184, 0.0002442139957565814, 0.0002824249677360058, 0.00032063593971543014]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 8.0, 4.0, 10.0, 7.0, 7.0, 12.0, 16.0, 26.0, 16.0, 27.0, 34.0, 23.0, 33.0, 31.0, 44.0, 45.0, 39.0, 34.0, 35.0, 40.0, 38.0, 38.0, 40.0, 32.0, 42.0, 34.0, 32.0, 26.0, 29.0, 21.0, 23.0, 18.0, 18.0, 22.0, 11.0, 17.0, 11.0, 18.0, 11.0, 5.0, 6.0, 4.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004457235336303711, -0.0004318300634622574, -0.0004179365932941437, -0.00040404312312602997, -0.00039014965295791626, -0.00037625618278980255, -0.00036236271262168884, -0.00034846924245357513, -0.0003345757722854614, -0.0003206823021173477, -0.000306788831949234, -0.0002928953617811203, -0.0002790018916130066, -0.0002651084214448929, -0.0002512149512767792, -0.00023732148110866547, -0.00022342801094055176, -0.00020953454077243805, -0.00019564107060432434, -0.00018174760043621063, -0.00016785413026809692, -0.00015396066009998322, -0.0001400671899318695, -0.0001261737197637558, -0.00011228024959564209, -9.838677942752838e-05, -8.449330925941467e-05, -7.059983909130096e-05, -5.6706368923187256e-05, -4.281289875507355e-05, -2.891942858695984e-05, -1.502595841884613e-05, -1.1324882507324219e-06, 1.2760981917381287e-05, 2.6654452085494995e-05, 4.0547922253608704e-05, 5.444139242172241e-05, 6.833486258983612e-05, 8.222833275794983e-05, 9.612180292606354e-05, 0.00011001527309417725, 0.00012390874326229095, 0.00013780221343040466, 0.00015169568359851837, 0.00016558915376663208, 0.0001794826239347458, 0.0001933760941028595, 0.0002072695642709732, 0.00022116303443908691, 0.00023505650460720062, 0.00024894997477531433, 0.00026284344494342804, 0.00027673691511154175, 0.00029063038527965546, 0.00030452385544776917, 0.0003184173256158829, 0.0003323107957839966, 0.0003462042659521103, 0.000360097736120224, 0.0003739912062883377, 0.0003878846764564514, 0.0004017781466245651, 0.00041567161679267883, 0.00042956508696079254, 0.00044345855712890625]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 8.0, 13.0, 8.0, 14.0, 20.0, 9.0, 18.0, 22.0, 27.0, 26.0, 26.0, 41.0, 29.0, 36.0, 41.0, 41.0, 39.0, 45.0, 52.0, 40.0, 53.0, 42.0, 40.0, 30.0, 27.0, 34.0, 25.0, 29.0, 27.0, 20.0, 28.0, 14.0, 15.0, 12.0, 6.0, 7.0, 6.0, 9.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.54296875, -3.439300537109375, -3.33563232421875, -3.231964111328125, -3.1282958984375, -3.024627685546875, -2.92095947265625, -2.817291259765625, -2.713623046875, -2.609954833984375, -2.50628662109375, -2.402618408203125, -2.2989501953125, -2.195281982421875, -2.09161376953125, -1.987945556640625, -1.88427734375, -1.780609130859375, -1.67694091796875, -1.573272705078125, -1.4696044921875, -1.365936279296875, -1.26226806640625, -1.158599853515625, -1.054931640625, -0.951263427734375, -0.84759521484375, -0.743927001953125, -0.6402587890625, -0.536590576171875, -0.43292236328125, -0.329254150390625, -0.2255859375, -0.121917724609375, -0.01824951171875, 0.085418701171875, 0.1890869140625, 0.292755126953125, 0.39642333984375, 0.500091552734375, 0.603759765625, 0.707427978515625, 0.81109619140625, 0.914764404296875, 1.0184326171875, 1.122100830078125, 1.22576904296875, 1.329437255859375, 1.43310546875, 1.536773681640625, 1.64044189453125, 1.744110107421875, 1.8477783203125, 1.951446533203125, 2.05511474609375, 2.158782958984375, 2.262451171875, 2.366119384765625, 2.46978759765625, 2.573455810546875, 2.6771240234375, 2.780792236328125, 2.88446044921875, 2.988128662109375, 3.091796875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 8.0, 17.0, 20.0, 26.0, 33.0, 52.0, 75.0, 122.0, 133.0, 216.0, 375.0, 481.0, 770.0, 1223.0, 2055.0, 3324.0, 5474.0, 9521.0, 17482.0, 34472.0, 75683.0, 189118.0, 378165.0, 182292.0, 73389.0, 33463.0, 16893.0, 9320.0, 5445.0, 3242.0, 1940.0, 1301.0, 823.0, 508.0, 322.0, 262.0, 150.0, 109.0, 75.0, 39.0, 39.0, 32.0, 29.0, 10.0, 5.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-2.482421875, -2.410430908203125, -2.33843994140625, -2.266448974609375, -2.1944580078125, -2.122467041015625, -2.05047607421875, -1.978485107421875, -1.906494140625, -1.834503173828125, -1.76251220703125, -1.690521240234375, -1.6185302734375, -1.546539306640625, -1.47454833984375, -1.402557373046875, -1.33056640625, -1.258575439453125, -1.18658447265625, -1.114593505859375, -1.0426025390625, -0.970611572265625, -0.89862060546875, -0.826629638671875, -0.754638671875, -0.682647705078125, -0.61065673828125, -0.538665771484375, -0.4666748046875, -0.394683837890625, -0.32269287109375, -0.250701904296875, -0.1787109375, -0.106719970703125, -0.03472900390625, 0.037261962890625, 0.1092529296875, 0.181243896484375, 0.25323486328125, 0.325225830078125, 0.397216796875, 0.469207763671875, 0.54119873046875, 0.613189697265625, 0.6851806640625, 0.757171630859375, 0.82916259765625, 0.901153564453125, 0.97314453125, 1.045135498046875, 1.11712646484375, 1.189117431640625, 1.2611083984375, 1.333099365234375, 1.40509033203125, 1.477081298828125, 1.549072265625, 1.621063232421875, 1.69305419921875, 1.765045166015625, 1.8370361328125, 1.909027099609375, 1.98101806640625, 2.053009033203125, 2.125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 2.0, 6.0, 7.0, 6.0, 11.0, 17.0, 16.0, 19.0, 22.0, 29.0, 28.0, 29.0, 43.0, 35.0, 39.0, 37.0, 52.0, 77.0, 188.0, 1709.0, 200.0, 71.0, 58.0, 39.0, 43.0, 40.0, 31.0, 29.0, 28.0, 25.0, 17.0, 10.0, 20.0, 18.0, 9.0, 11.0, 5.0, 6.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.640625, -12.2403564453125, -11.840087890625, -11.4398193359375, -11.03955078125, -10.6392822265625, -10.239013671875, -9.8387451171875, -9.4384765625, -9.0382080078125, -8.637939453125, -8.2376708984375, -7.83740234375, -7.4371337890625, -7.036865234375, -6.6365966796875, -6.236328125, -5.8360595703125, -5.435791015625, -5.0355224609375, -4.63525390625, -4.2349853515625, -3.834716796875, -3.4344482421875, -3.0341796875, -2.6339111328125, -2.233642578125, -1.8333740234375, -1.43310546875, -1.0328369140625, -0.632568359375, -0.2322998046875, 0.16796875, 0.5682373046875, 0.968505859375, 1.3687744140625, 1.76904296875, 2.1693115234375, 2.569580078125, 2.9698486328125, 3.3701171875, 3.7703857421875, 4.170654296875, 4.5709228515625, 4.97119140625, 5.3714599609375, 5.771728515625, 6.1719970703125, 6.572265625, 6.9725341796875, 7.372802734375, 7.7730712890625, 8.17333984375, 8.5736083984375, 8.973876953125, 9.3741455078125, 9.7744140625, 10.1746826171875, 10.574951171875, 10.9752197265625, 11.37548828125, 11.7757568359375, 12.176025390625, 12.5762939453125, 12.9765625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 5.0, 5.0, 3.0, 6.0, 5.0, 15.0, 12.0, 16.0, 24.0, 25.0, 29.0, 32.0, 38.0, 65.0, 84.0, 113.0, 245.0, 447.0, 1389.0, 13595.0, 2611454.0, 508394.0, 7566.0, 1096.0, 350.0, 193.0, 130.0, 75.0, 55.0, 51.0, 43.0, 28.0, 20.0, 18.0, 17.0, 14.0, 11.0, 7.0, 12.0, 9.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.9375, -20.281005859375, -19.62451171875, -18.968017578125, -18.3115234375, -17.655029296875, -16.99853515625, -16.342041015625, -15.685546875, -15.029052734375, -14.37255859375, -13.716064453125, -13.0595703125, -12.403076171875, -11.74658203125, -11.090087890625, -10.43359375, -9.777099609375, -9.12060546875, -8.464111328125, -7.8076171875, -7.151123046875, -6.49462890625, -5.838134765625, -5.181640625, -4.525146484375, -3.86865234375, -3.212158203125, -2.5556640625, -1.899169921875, -1.24267578125, -0.586181640625, 0.0703125, 0.726806640625, 1.38330078125, 2.039794921875, 2.6962890625, 3.352783203125, 4.00927734375, 4.665771484375, 5.322265625, 5.978759765625, 6.63525390625, 7.291748046875, 7.9482421875, 8.604736328125, 9.26123046875, 9.917724609375, 10.57421875, 11.230712890625, 11.88720703125, 12.543701171875, 13.2001953125, 13.856689453125, 14.51318359375, 15.169677734375, 15.826171875, 16.482666015625, 17.13916015625, 17.795654296875, 18.4521484375, 19.108642578125, 19.76513671875, 20.421630859375, 21.078125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 62.0, 953.0, 3.0, 0.0, 1.0], "bins": [-456.1365051269531, -448.56988525390625, -441.0032958984375, -433.4366760253906, -425.87005615234375, -418.303466796875, -410.7368469238281, -403.17022705078125, -395.6036376953125, -388.0370178222656, -380.4704284667969, -372.90380859375, -365.3371887207031, -357.77056884765625, -350.2039794921875, -342.6373596191406, -335.07073974609375, -327.5041198730469, -319.9375305175781, -312.37091064453125, -304.8042907714844, -297.2376708984375, -289.67108154296875, -282.1044616699219, -274.537841796875, -266.9712219238281, -259.4046325683594, -251.8380126953125, -244.27139282226562, -236.7047882080078, -229.13818359375, -221.57156372070312, -214.00497436523438, -206.43836975097656, -198.8717498779297, -191.30514526367188, -183.738525390625, -176.1719207763672, -168.60531616210938, -161.0386962890625, -153.4720916748047, -145.90548706054688, -138.3388671875, -130.7722625732422, -123.20565032958984, -115.6390380859375, -108.07243347167969, -100.50582122802734, -92.939208984375, -85.37259674072266, -77.80598449707031, -70.2393798828125, -62.672767639160156, -55.10615539550781, -47.539546966552734, -39.972938537597656, -32.40632629394531, -24.8397159576416, -17.27310562133789, -9.70649528503418, -2.1398849487304688, 5.426727294921875, 12.993335723876953, 20.55994415283203, 28.126558303833008]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 3.0, 7.0, 15.0, 8.0, 17.0, 12.0, 22.0, 14.0, 31.0, 22.0, 34.0, 26.0, 39.0, 35.0, 39.0, 36.0, 31.0, 46.0, 41.0, 49.0, 45.0, 44.0, 40.0, 40.0, 34.0, 31.0, 35.0, 33.0, 26.0, 23.0, 22.0, 20.0, 13.0, 11.0, 13.0, 3.0, 7.0, 7.0, 10.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.53909683227539, -33.306514739990234, -32.07393264770508, -30.841350555419922, -29.608768463134766, -28.37618637084961, -27.143606185913086, -25.91102409362793, -24.678442001342773, -23.445859909057617, -22.21327781677246, -20.980695724487305, -19.74811553955078, -18.515533447265625, -17.28295135498047, -16.050369262695312, -14.817787170410156, -13.585205078125, -12.352622985839844, -11.120041847229004, -9.887459754943848, -8.654877662658691, -7.422296047210693, -6.189714431762695, -4.957132339477539, -3.724550485610962, -2.4919686317443848, -1.2593867778778076, -0.02680492401123047, 1.2057771682739258, 2.438358783721924, 3.670940399169922, 4.9035186767578125, 6.136100769042969, 7.368682384490967, 8.601263999938965, 9.833846092224121, 11.066428184509277, 12.299009323120117, 13.531591415405273, 14.76417350769043, 15.996755599975586, 17.229337692260742, 18.4619197845459, 19.694499969482422, 20.927082061767578, 22.159664154052734, 23.39224624633789, 24.624828338623047, 25.857410430908203, 27.08999252319336, 28.322574615478516, 29.555156707763672, 30.787738800048828, 32.020320892333984, 33.252899169921875, 34.48548126220703, 35.71806335449219, 36.950645446777344, 38.1832275390625, 39.415809631347656, 40.64839172363281, 41.88097381591797, 43.113555908203125, 44.34613800048828]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 8.0, 13.0, 9.0, 6.0, 23.0, 15.0, 16.0, 18.0, 20.0, 23.0, 28.0, 32.0, 29.0, 39.0, 37.0, 38.0, 39.0, 47.0, 44.0, 42.0, 59.0, 39.0, 33.0, 40.0, 40.0, 30.0, 26.0, 20.0, 32.0, 33.0, 21.0, 16.0, 17.0, 16.0, 9.0, 12.0, 3.0, 5.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.560546875, -3.4522705078125, -3.343994140625, -3.2357177734375, -3.12744140625, -3.0191650390625, -2.910888671875, -2.8026123046875, -2.6943359375, -2.5860595703125, -2.477783203125, -2.3695068359375, -2.26123046875, -2.1529541015625, -2.044677734375, -1.9364013671875, -1.828125, -1.7198486328125, -1.611572265625, -1.5032958984375, -1.39501953125, -1.2867431640625, -1.178466796875, -1.0701904296875, -0.9619140625, -0.8536376953125, -0.745361328125, -0.6370849609375, -0.52880859375, -0.4205322265625, -0.312255859375, -0.2039794921875, -0.095703125, 0.0125732421875, 0.120849609375, 0.2291259765625, 0.33740234375, 0.4456787109375, 0.553955078125, 0.6622314453125, 0.7705078125, 0.8787841796875, 0.987060546875, 1.0953369140625, 1.20361328125, 1.3118896484375, 1.420166015625, 1.5284423828125, 1.63671875, 1.7449951171875, 1.853271484375, 1.9615478515625, 2.06982421875, 2.1781005859375, 2.286376953125, 2.3946533203125, 2.5029296875, 2.6112060546875, 2.719482421875, 2.8277587890625, 2.93603515625, 3.0443115234375, 3.152587890625, 3.2608642578125, 3.369140625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 10.0, 7.0, 5.0, 10.0, 13.0, 16.0, 18.0, 21.0, 13.0, 14.0, 27.0, 30.0, 29.0, 54.0, 85.0, 137.0, 315.0, 1414.0, 15721.0, 503418.0, 3510550.0, 153821.0, 7042.0, 805.0, 243.0, 106.0, 59.0, 42.0, 36.0, 28.0, 20.0, 33.0, 20.0, 18.0, 24.0, 15.0, 12.0, 6.0, 11.0, 6.0, 2.0, 4.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-19.03125, -18.477294921875, -17.92333984375, -17.369384765625, -16.8154296875, -16.261474609375, -15.70751953125, -15.153564453125, -14.599609375, -14.045654296875, -13.49169921875, -12.937744140625, -12.3837890625, -11.829833984375, -11.27587890625, -10.721923828125, -10.16796875, -9.614013671875, -9.06005859375, -8.506103515625, -7.9521484375, -7.398193359375, -6.84423828125, -6.290283203125, -5.736328125, -5.182373046875, -4.62841796875, -4.074462890625, -3.5205078125, -2.966552734375, -2.41259765625, -1.858642578125, -1.3046875, -0.750732421875, -0.19677734375, 0.357177734375, 0.9111328125, 1.465087890625, 2.01904296875, 2.572998046875, 3.126953125, 3.680908203125, 4.23486328125, 4.788818359375, 5.3427734375, 5.896728515625, 6.45068359375, 7.004638671875, 7.55859375, 8.112548828125, 8.66650390625, 9.220458984375, 9.7744140625, 10.328369140625, 10.88232421875, 11.436279296875, 11.990234375, 12.544189453125, 13.09814453125, 13.652099609375, 14.2060546875, 14.760009765625, 15.31396484375, 15.867919921875, 16.421875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 7.0, 17.0, 20.0, 37.0, 37.0, 58.0, 77.0, 119.0, 165.0, 224.0, 315.0, 423.0, 504.0, 510.0, 443.0, 333.0, 242.0, 176.0, 107.0, 87.0, 64.0, 35.0, 17.0, 10.0, 10.0, 13.0, 7.0, 6.0, 3.0, 5.0, 1.0], "bins": [-17.875, -17.48712158203125, -17.0992431640625, -16.71136474609375, -16.323486328125, -15.93560791015625, -15.5477294921875, -15.15985107421875, -14.77197265625, -14.38409423828125, -13.9962158203125, -13.60833740234375, -13.220458984375, -12.83258056640625, -12.4447021484375, -12.05682373046875, -11.6689453125, -11.28106689453125, -10.8931884765625, -10.50531005859375, -10.117431640625, -9.72955322265625, -9.3416748046875, -8.95379638671875, -8.56591796875, -8.17803955078125, -7.7901611328125, -7.40228271484375, -7.014404296875, -6.62652587890625, -6.2386474609375, -5.85076904296875, -5.462890625, -5.07501220703125, -4.6871337890625, -4.29925537109375, -3.911376953125, -3.52349853515625, -3.1356201171875, -2.74774169921875, -2.35986328125, -1.97198486328125, -1.5841064453125, -1.19622802734375, -0.808349609375, -0.42047119140625, -0.0325927734375, 0.35528564453125, 0.7431640625, 1.13104248046875, 1.5189208984375, 1.90679931640625, 2.294677734375, 2.68255615234375, 3.0704345703125, 3.45831298828125, 3.84619140625, 4.23406982421875, 4.6219482421875, 5.00982666015625, 5.397705078125, 5.78558349609375, 6.1734619140625, 6.56134033203125, 6.94921875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 13.0, 11.0, 10.0, 24.0, 39.0, 35.0, 59.0, 81.0, 174.0, 317.0, 635.0, 2402.0, 90552.0, 3970264.0, 125268.0, 2830.0, 696.0, 321.0, 183.0, 132.0, 71.0, 60.0, 34.0, 27.0, 18.0, 8.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.21875, -40.8359375, -39.453125, -38.0703125, -36.6875, -35.3046875, -33.921875, -32.5390625, -31.15625, -29.7734375, -28.390625, -27.0078125, -25.625, -24.2421875, -22.859375, -21.4765625, -20.09375, -18.7109375, -17.328125, -15.9453125, -14.5625, -13.1796875, -11.796875, -10.4140625, -9.03125, -7.6484375, -6.265625, -4.8828125, -3.5, -2.1171875, -0.734375, 0.6484375, 2.03125, 3.4140625, 4.796875, 6.1796875, 7.5625, 8.9453125, 10.328125, 11.7109375, 13.09375, 14.4765625, 15.859375, 17.2421875, 18.625, 20.0078125, 21.390625, 22.7734375, 24.15625, 25.5390625, 26.921875, 28.3046875, 29.6875, 31.0703125, 32.453125, 33.8359375, 35.21875, 36.6015625, 37.984375, 39.3671875, 40.75, 42.1328125, 43.515625, 44.8984375, 46.28125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 88.0, 254.0, 372.0, 208.0, 62.0, 15.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.20643615722656, -55.73166275024414, -51.25688934326172, -46.7821159362793, -42.307342529296875, -37.83256912231445, -33.35779571533203, -28.88302230834961, -24.408248901367188, -19.933475494384766, -15.458702087402344, -10.983928680419922, -6.5091552734375, -2.034381866455078, 2.4403915405273438, 6.915164947509766, 11.389938354492188, 15.86471176147461, 20.33948516845703, 24.814258575439453, 29.289031982421875, 33.7638053894043, 38.23857879638672, 42.71335220336914, 47.18812561035156, 51.662899017333984, 56.137672424316406, 60.61244583129883, 65.08721923828125, 69.56199645996094, 74.0367660522461, 78.51153564453125, 82.98631286621094, 87.46109008789062, 91.93585968017578, 96.41062927246094, 100.88540649414062, 105.36018371582031, 109.83495330810547, 114.30972290039062, 118.78450012207031, 123.25927734375, 127.73404693603516, 132.2088165283203, 136.68359375, 141.1583709716797, 145.63314819335938, 150.10791015625, 154.5826873779297, 159.05746459960938, 163.5322265625, 168.0070037841797, 172.48178100585938, 176.95655822753906, 181.43133544921875, 185.90609741210938, 190.38087463378906, 194.85565185546875, 199.33041381835938, 203.80519104003906, 208.27996826171875, 212.75474548339844, 217.22952270507812, 221.70428466796875, 226.17906188964844]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 12.0, 8.0, 15.0, 15.0, 15.0, 20.0, 18.0, 19.0, 19.0, 20.0, 22.0, 24.0, 43.0, 30.0, 22.0, 38.0, 42.0, 33.0, 31.0, 48.0, 31.0, 40.0, 34.0, 40.0, 34.0, 32.0, 30.0, 29.0, 21.0, 15.0, 23.0, 17.0, 15.0, 18.0, 14.0, 19.0, 12.0, 11.0, 7.0, 9.0, 7.0, 4.0, 6.0, 9.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 5.0], "bins": [-35.346435546875, -34.28113555908203, -33.21583557128906, -32.15053939819336, -31.08523941040039, -30.019939422607422, -28.954641342163086, -27.88934326171875, -26.82404327392578, -25.758743286132812, -24.693445205688477, -23.62814712524414, -22.562847137451172, -21.497547149658203, -20.432249069213867, -19.36695098876953, -18.301651000976562, -17.236351013183594, -16.171052932739258, -15.105753898620605, -14.040454864501953, -12.9751558303833, -11.909856796264648, -10.844557762145996, -9.779258728027344, -8.713959693908691, -7.648660659790039, -6.583361625671387, -5.518062591552734, -4.452763557434082, -3.3874645233154297, -2.3221654891967773, -1.256866455078125, -0.19156742095947266, 0.8737316131591797, 1.939030647277832, 3.0043296813964844, 4.069628715515137, 5.134927749633789, 6.200226783752441, 7.265525817871094, 8.330824851989746, 9.396123886108398, 10.46142292022705, 11.526721954345703, 12.592020988464355, 13.657320022583008, 14.72261905670166, 15.787918090820312, 16.85321807861328, 17.918516159057617, 18.983814239501953, 20.049114227294922, 21.11441421508789, 22.179712295532227, 23.245010375976562, 24.31031036376953, 25.3756103515625, 26.440908432006836, 27.506206512451172, 28.57150650024414, 29.63680648803711, 30.702104568481445, 31.76740264892578, 32.83270263671875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 5.0, 8.0, 9.0, 9.0, 17.0, 14.0, 13.0, 19.0, 28.0, 31.0, 32.0, 23.0, 28.0, 31.0, 34.0, 47.0, 41.0, 46.0, 40.0, 54.0, 42.0, 46.0, 36.0, 36.0, 37.0, 28.0, 32.0, 29.0, 36.0, 21.0, 25.0, 21.0, 15.0, 12.0, 13.0, 8.0, 11.0, 5.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.11993408203125, -4.0054931640625, -3.89105224609375, -3.776611328125, -3.66217041015625, -3.5477294921875, -3.43328857421875, -3.31884765625, -3.20440673828125, -3.0899658203125, -2.97552490234375, -2.861083984375, -2.74664306640625, -2.6322021484375, -2.51776123046875, -2.4033203125, -2.28887939453125, -2.1744384765625, -2.05999755859375, -1.945556640625, -1.83111572265625, -1.7166748046875, -1.60223388671875, -1.48779296875, -1.37335205078125, -1.2589111328125, -1.14447021484375, -1.030029296875, -0.91558837890625, -0.8011474609375, -0.68670654296875, -0.572265625, -0.45782470703125, -0.3433837890625, -0.22894287109375, -0.114501953125, -6.103515625e-05, 0.1143798828125, 0.22882080078125, 0.34326171875, 0.45770263671875, 0.5721435546875, 0.68658447265625, 0.801025390625, 0.91546630859375, 1.0299072265625, 1.14434814453125, 1.2587890625, 1.37322998046875, 1.4876708984375, 1.60211181640625, 1.716552734375, 1.83099365234375, 1.9454345703125, 2.05987548828125, 2.17431640625, 2.28875732421875, 2.4031982421875, 2.51763916015625, 2.632080078125, 2.74652099609375, 2.8609619140625, 2.97540283203125, 3.08984375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 13.0, 24.0, 33.0, 57.0, 57.0, 102.0, 123.0, 228.0, 303.0, 428.0, 641.0, 887.0, 1366.0, 1925.0, 2928.0, 4086.0, 5966.0, 9002.0, 13419.0, 20235.0, 31620.0, 50999.0, 83689.0, 134134.0, 186031.0, 175545.0, 120487.0, 74158.0, 45512.0, 28408.0, 18418.0, 12260.0, 8067.0, 5440.0, 3664.0, 2508.0, 1860.0, 1248.0, 856.0, 588.0, 370.0, 271.0, 194.0, 132.0, 87.0, 71.0, 40.0, 35.0, 12.0, 10.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.3515625, -0.3408699035644531, -0.33017730712890625, -0.3194847106933594, -0.3087921142578125, -0.2980995178222656, -0.28740692138671875, -0.2767143249511719, -0.266021728515625, -0.2553291320800781, -0.24463653564453125, -0.23394393920898438, -0.2232513427734375, -0.21255874633789062, -0.20186614990234375, -0.19117355346679688, -0.18048095703125, -0.16978836059570312, -0.15909576416015625, -0.14840316772460938, -0.1377105712890625, -0.12701797485351562, -0.11632537841796875, -0.10563278198242188, -0.094940185546875, -0.08424758911132812, -0.07355499267578125, -0.06286239624023438, -0.0521697998046875, -0.041477203369140625, -0.03078460693359375, -0.020092010498046875, -0.0093994140625, 0.001293182373046875, 0.01198577880859375, 0.022678375244140625, 0.0333709716796875, 0.044063568115234375, 0.05475616455078125, 0.06544876098632812, 0.076141357421875, 0.08683395385742188, 0.09752655029296875, 0.10821914672851562, 0.1189117431640625, 0.12960433959960938, 0.14029693603515625, 0.15098953247070312, 0.16168212890625, 0.17237472534179688, 0.18306732177734375, 0.19375991821289062, 0.2044525146484375, 0.21514511108398438, 0.22583770751953125, 0.23653030395507812, 0.247222900390625, 0.2579154968261719, 0.26860809326171875, 0.2793006896972656, 0.2899932861328125, 0.3006858825683594, 0.31137847900390625, 0.3220710754394531, 0.332763671875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 5.0, 6.0, 5.0, 5.0, 6.0, 3.0, 9.0, 8.0, 11.0, 14.0, 13.0, 16.0, 25.0, 19.0, 29.0, 38.0, 19.0, 22.0, 42.0, 28.0, 37.0, 38.0, 32.0, 30.0, 1069.0, 36.0, 29.0, 38.0, 40.0, 35.0, 18.0, 20.0, 36.0, 31.0, 26.0, 29.0, 20.0, 17.0, 21.0, 15.0, 16.0, 10.0, 12.0, 5.0, 5.0, 11.0, 4.0, 8.0, 7.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0], "bins": [-1.984375, -1.920135498046875, -1.85589599609375, -1.791656494140625, -1.7274169921875, -1.663177490234375, -1.59893798828125, -1.534698486328125, -1.470458984375, -1.406219482421875, -1.34197998046875, -1.277740478515625, -1.2135009765625, -1.149261474609375, -1.08502197265625, -1.020782470703125, -0.95654296875, -0.892303466796875, -0.82806396484375, -0.763824462890625, -0.6995849609375, -0.635345458984375, -0.57110595703125, -0.506866455078125, -0.442626953125, -0.378387451171875, -0.31414794921875, -0.249908447265625, -0.1856689453125, -0.121429443359375, -0.05718994140625, 0.007049560546875, 0.0712890625, 0.135528564453125, 0.19976806640625, 0.264007568359375, 0.3282470703125, 0.392486572265625, 0.45672607421875, 0.520965576171875, 0.585205078125, 0.649444580078125, 0.71368408203125, 0.777923583984375, 0.8421630859375, 0.906402587890625, 0.97064208984375, 1.034881591796875, 1.09912109375, 1.163360595703125, 1.22760009765625, 1.291839599609375, 1.3560791015625, 1.420318603515625, 1.48455810546875, 1.548797607421875, 1.613037109375, 1.677276611328125, 1.74151611328125, 1.805755615234375, 1.8699951171875, 1.934234619140625, 1.99847412109375, 2.062713623046875, 2.126953125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 7.0, 10.0, 17.0, 23.0, 41.0, 43.0, 63.0, 106.0, 143.0, 238.0, 309.0, 437.0, 732.0, 1154.0, 1770.0, 2750.0, 4485.0, 7443.0, 11963.0, 19683.0, 33267.0, 56020.0, 93002.0, 145683.0, 1234483.0, 173181.0, 121877.0, 75213.0, 44619.0, 26718.0, 15978.0, 9626.0, 6023.0, 3605.0, 2288.0, 1452.0, 934.0, 586.0, 405.0, 234.0, 169.0, 122.0, 76.0, 45.0, 34.0, 21.0, 21.0, 9.0, 11.0, 8.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.26123046875, -0.2521553039550781, -0.24308013916015625, -0.23400497436523438, -0.2249298095703125, -0.21585464477539062, -0.20677947998046875, -0.19770431518554688, -0.188629150390625, -0.17955398559570312, -0.17047882080078125, -0.16140365600585938, -0.1523284912109375, -0.14325332641601562, -0.13417816162109375, -0.12510299682617188, -0.11602783203125, -0.10695266723632812, -0.09787750244140625, -0.08880233764648438, -0.0797271728515625, -0.07065200805664062, -0.06157684326171875, -0.052501678466796875, -0.043426513671875, -0.034351348876953125, -0.02527618408203125, -0.016201019287109375, -0.0071258544921875, 0.001949310302734375, 0.01102447509765625, 0.020099639892578125, 0.0291748046875, 0.038249969482421875, 0.04732513427734375, 0.056400299072265625, 0.0654754638671875, 0.07455062866210938, 0.08362579345703125, 0.09270095825195312, 0.101776123046875, 0.11085128784179688, 0.11992645263671875, 0.12900161743164062, 0.1380767822265625, 0.14715194702148438, 0.15622711181640625, 0.16530227661132812, 0.17437744140625, 0.18345260620117188, 0.19252777099609375, 0.20160293579101562, 0.2106781005859375, 0.21975326538085938, 0.22882843017578125, 0.23790359497070312, 0.246978759765625, 0.2560539245605469, 0.26512908935546875, 0.2742042541503906, 0.2832794189453125, 0.2923545837402344, 0.30142974853515625, 0.3105049133300781, 0.319580078125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 15.0, 7.0, 13.0, 18.0, 17.0, 22.0, 17.0, 25.0, 28.0, 34.0, 31.0, 28.0, 50.0, 45.0, 49.0, 39.0, 61.0, 43.0, 47.0, 49.0, 35.0, 41.0, 33.0, 28.0, 31.0, 27.0, 22.0, 23.0, 28.0, 17.0, 13.0, 12.0, 7.0, 7.0, 4.0, 8.0, 6.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0008392333984375, -0.0008132904767990112, -0.0007873475551605225, -0.0007614046335220337, -0.0007354617118835449, -0.0007095187902450562, -0.0006835758686065674, -0.0006576329469680786, -0.0006316900253295898, -0.0006057471036911011, -0.0005798041820526123, -0.0005538612604141235, -0.0005279183387756348, -0.000501975417137146, -0.0004760324954986572, -0.00045008957386016846, -0.0004241466522216797, -0.0003982037305831909, -0.00037226080894470215, -0.0003463178873062134, -0.0003203749656677246, -0.00029443204402923584, -0.00026848912239074707, -0.0002425462007522583, -0.00021660327911376953, -0.00019066035747528076, -0.000164717435836792, -0.00013877451419830322, -0.00011283159255981445, -8.688867092132568e-05, -6.0945749282836914e-05, -3.5002827644348145e-05, -9.059906005859375e-06, 1.6883015632629395e-05, 4.2825937271118164e-05, 6.876885890960693e-05, 9.47117805480957e-05, 0.00012065470218658447, 0.00014659762382507324, 0.000172540545463562, 0.00019848346710205078, 0.00022442638874053955, 0.0002503693103790283, 0.0002763122320175171, 0.00030225515365600586, 0.00032819807529449463, 0.0003541409969329834, 0.00038008391857147217, 0.00040602684020996094, 0.0004319697618484497, 0.0004579126834869385, 0.00048385560512542725, 0.000509798526763916, 0.0005357414484024048, 0.0005616843700408936, 0.0005876272916793823, 0.0006135702133178711, 0.0006395131349563599, 0.0006654560565948486, 0.0006913989782333374, 0.0007173418998718262, 0.0007432848215103149, 0.0007692277431488037, 0.0007951706647872925, 0.0008211135864257812]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 9.0, 8.0, 10.0, 16.0, 18.0, 31.0, 26.0, 25.0, 51.0, 63.0, 62.0, 120.0, 132.0, 183.0, 276.0, 445.0, 2024.0, 381307.0, 659019.0, 3157.0, 511.0, 279.0, 139.0, 147.0, 102.0, 99.0, 68.0, 43.0, 41.0, 37.0, 25.0, 22.0, 15.0, 10.0, 5.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0171966552734375, -0.016643047332763672, -0.016089439392089844, -0.015535831451416016, -0.014982223510742188, -0.01442861557006836, -0.013875007629394531, -0.013321399688720703, -0.012767791748046875, -0.012214183807373047, -0.011660575866699219, -0.01110696792602539, -0.010553359985351562, -0.009999752044677734, -0.009446144104003906, -0.008892536163330078, -0.00833892822265625, -0.007785320281982422, -0.007231712341308594, -0.006678104400634766, -0.0061244964599609375, -0.005570888519287109, -0.005017280578613281, -0.004463672637939453, -0.003910064697265625, -0.003356456756591797, -0.0028028488159179688, -0.0022492408752441406, -0.0016956329345703125, -0.0011420249938964844, -0.0005884170532226562, -3.4809112548828125e-05, 0.000518798828125, 0.0010724067687988281, 0.0016260147094726562, 0.0021796226501464844, 0.0027332305908203125, 0.0032868385314941406, 0.0038404464721679688, 0.004394054412841797, 0.004947662353515625, 0.005501270294189453, 0.006054878234863281, 0.006608486175537109, 0.0071620941162109375, 0.007715702056884766, 0.008269309997558594, 0.008822917938232422, 0.00937652587890625, 0.009930133819580078, 0.010483741760253906, 0.011037349700927734, 0.011590957641601562, 0.01214456558227539, 0.012698173522949219, 0.013251781463623047, 0.013805389404296875, 0.014358997344970703, 0.014912605285644531, 0.01546621322631836, 0.016019821166992188, 0.016573429107666016, 0.017127037048339844, 0.017680644989013672, 0.0182342529296875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 111.0, 634.0, 245.0, 18.0, 3.0, 1.0], "bins": [-0.008335847407579422, -0.008196127600967884, -0.008056406863033772, -0.007916687056422234, -0.007776966784149408, -0.007637246511876583, -0.007497526705265045, -0.00735780643299222, -0.007218086160719395, -0.0070783658884465694, -0.006938645616173744, -0.006798925809562206, -0.006659205537289381, -0.006519485265016556, -0.006379765458405018, -0.006240045186132193, -0.006100324913859367, -0.005960604641586542, -0.005820884369313717, -0.005681164562702179, -0.005541444290429354, -0.0054017240181565285, -0.0052620042115449905, -0.005122283939272165, -0.00498256366699934, -0.004842843394726515, -0.00470312312245369, -0.004563403315842152, -0.004423683043569326, -0.004283962771296501, -0.004144242964684963, -0.004004522692412138, -0.0038648024201393127, -0.0037250821478664875, -0.003585362108424306, -0.0034456420689821243, -0.003305921796709299, -0.003166201524436474, -0.0030264814849942923, -0.0028867614455521107, -0.0027470411732792854, -0.00260732090100646, -0.0024676008615642786, -0.002327880822122097, -0.0021881605498492718, -0.0020484402775764465, -0.001908720238134265, -0.0017690000822767615, -0.00162928004283458, -0.0014895598869770765, -0.0013498397311195731, -0.0012101195752620697, -0.0010703994194045663, -0.0009306792635470629, -0.0007909591076895595, -0.000651238951832056, -0.0005115187959745526, -0.0003717986401170492, -0.0002320784842595458, -9.235832840204239e-05, 4.7361827455461025e-05, 0.00018708198331296444, 0.00032680213917046785, 0.00046652229502797127, 0.0006062424508854747]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 5.0, 4.0, 4.0, 13.0, 11.0, 6.0, 10.0, 9.0, 24.0, 27.0, 23.0, 23.0, 33.0, 35.0, 46.0, 33.0, 39.0, 41.0, 30.0, 37.0, 49.0, 50.0, 45.0, 30.0, 32.0, 47.0, 38.0, 33.0, 29.0, 32.0, 30.0, 20.0, 21.0, 20.0, 14.0, 13.0, 15.0, 5.0, 4.0, 5.0, 8.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0005630254745483398, -0.0005469545722007751, -0.0005308836698532104, -0.0005148127675056458, -0.0004987418651580811, -0.00048267096281051636, -0.00046660006046295166, -0.00045052915811538696, -0.00043445825576782227, -0.00041838735342025757, -0.00040231645107269287, -0.0003862455487251282, -0.0003701746463775635, -0.0003541037440299988, -0.0003380328416824341, -0.0003219619393348694, -0.0003058910369873047, -0.00028982013463974, -0.0002737492322921753, -0.0002576783299446106, -0.0002416074275970459, -0.0002255365252494812, -0.0002094656229019165, -0.0001933947205543518, -0.0001773238182067871, -0.0001612529158592224, -0.00014518201351165771, -0.00012911111116409302, -0.00011304020881652832, -9.696930646896362e-05, -8.089840412139893e-05, -6.482750177383423e-05, -4.875659942626953e-05, -3.2685697078704834e-05, -1.6614794731140137e-05, -5.438923835754395e-07, 1.5527009963989258e-05, 3.1597912311553955e-05, 4.766881465911865e-05, 6.373971700668335e-05, 7.981061935424805e-05, 9.588152170181274e-05, 0.00011195242404937744, 0.00012802332639694214, 0.00014409422874450684, 0.00016016513109207153, 0.00017623603343963623, 0.00019230693578720093, 0.00020837783813476562, 0.00022444874048233032, 0.00024051964282989502, 0.0002565905451774597, 0.0002726614475250244, 0.0002887323498725891, 0.0003048032522201538, 0.0003208741545677185, 0.0003369450569152832, 0.0003530159592628479, 0.0003690868616104126, 0.0003851577639579773, 0.000401228666305542, 0.0004172995686531067, 0.0004333704710006714, 0.0004494413733482361, 0.0004655122756958008]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 5.0, 8.0, 9.0, 9.0, 17.0, 14.0, 13.0, 19.0, 28.0, 31.0, 32.0, 23.0, 28.0, 31.0, 33.0, 48.0, 41.0, 46.0, 40.0, 54.0, 42.0, 46.0, 36.0, 36.0, 37.0, 28.0, 32.0, 29.0, 36.0, 21.0, 25.0, 21.0, 15.0, 12.0, 13.0, 8.0, 11.0, 5.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.11993408203125, -4.0054931640625, -3.89105224609375, -3.776611328125, -3.66217041015625, -3.5477294921875, -3.43328857421875, -3.31884765625, -3.20440673828125, -3.0899658203125, -2.97552490234375, -2.861083984375, -2.74664306640625, -2.6322021484375, -2.51776123046875, -2.4033203125, -2.28887939453125, -2.1744384765625, -2.05999755859375, -1.945556640625, -1.83111572265625, -1.7166748046875, -1.60223388671875, -1.48779296875, -1.37335205078125, -1.2589111328125, -1.14447021484375, -1.030029296875, -0.91558837890625, -0.8011474609375, -0.68670654296875, -0.572265625, -0.45782470703125, -0.3433837890625, -0.22894287109375, -0.114501953125, -6.103515625e-05, 0.1143798828125, 0.22882080078125, 0.34326171875, 0.45770263671875, 0.5721435546875, 0.68658447265625, 0.801025390625, 0.91546630859375, 1.0299072265625, 1.14434814453125, 1.2587890625, 1.37322998046875, 1.4876708984375, 1.60211181640625, 1.716552734375, 1.83099365234375, 1.9454345703125, 2.05987548828125, 2.17431640625, 2.28875732421875, 2.4031982421875, 2.51763916015625, 2.632080078125, 2.74652099609375, 2.8609619140625, 2.97540283203125, 3.08984375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 9.0, 5.0, 11.0, 16.0, 22.0, 34.0, 38.0, 63.0, 88.0, 128.0, 229.0, 348.0, 509.0, 832.0, 1487.0, 2750.0, 5526.0, 12331.0, 31732.0, 97724.0, 326635.0, 382716.0, 119720.0, 37749.0, 14082.0, 6208.0, 3176.0, 1697.0, 1014.0, 609.0, 371.0, 250.0, 159.0, 83.0, 63.0, 36.0, 29.0, 29.0, 11.0, 9.0, 9.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.162109375, -3.0693359375, -2.9765625, -2.8837890625, -2.791015625, -2.6982421875, -2.60546875, -2.5126953125, -2.419921875, -2.3271484375, -2.234375, -2.1416015625, -2.048828125, -1.9560546875, -1.86328125, -1.7705078125, -1.677734375, -1.5849609375, -1.4921875, -1.3994140625, -1.306640625, -1.2138671875, -1.12109375, -1.0283203125, -0.935546875, -0.8427734375, -0.75, -0.6572265625, -0.564453125, -0.4716796875, -0.37890625, -0.2861328125, -0.193359375, -0.1005859375, -0.0078125, 0.0849609375, 0.177734375, 0.2705078125, 0.36328125, 0.4560546875, 0.548828125, 0.6416015625, 0.734375, 0.8271484375, 0.919921875, 1.0126953125, 1.10546875, 1.1982421875, 1.291015625, 1.3837890625, 1.4765625, 1.5693359375, 1.662109375, 1.7548828125, 1.84765625, 1.9404296875, 2.033203125, 2.1259765625, 2.21875, 2.3115234375, 2.404296875, 2.4970703125, 2.58984375, 2.6826171875, 2.775390625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 6.0, 10.0, 8.0, 12.0, 23.0, 10.0, 26.0, 18.0, 23.0, 39.0, 29.0, 40.0, 49.0, 45.0, 36.0, 59.0, 133.0, 1713.0, 290.0, 86.0, 57.0, 50.0, 39.0, 43.0, 26.0, 33.0, 22.0, 27.0, 25.0, 20.0, 9.0, 12.0, 9.0, 5.0, 5.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5625, -12.1258544921875, -11.689208984375, -11.2525634765625, -10.81591796875, -10.3792724609375, -9.942626953125, -9.5059814453125, -9.0693359375, -8.6326904296875, -8.196044921875, -7.7593994140625, -7.32275390625, -6.8861083984375, -6.449462890625, -6.0128173828125, -5.576171875, -5.1395263671875, -4.702880859375, -4.2662353515625, -3.82958984375, -3.3929443359375, -2.956298828125, -2.5196533203125, -2.0830078125, -1.6463623046875, -1.209716796875, -0.7730712890625, -0.33642578125, 0.1002197265625, 0.536865234375, 0.9735107421875, 1.41015625, 1.8468017578125, 2.283447265625, 2.7200927734375, 3.15673828125, 3.5933837890625, 4.030029296875, 4.4666748046875, 4.9033203125, 5.3399658203125, 5.776611328125, 6.2132568359375, 6.64990234375, 7.0865478515625, 7.523193359375, 7.9598388671875, 8.396484375, 8.8331298828125, 9.269775390625, 9.7064208984375, 10.14306640625, 10.5797119140625, 11.016357421875, 11.4530029296875, 11.8896484375, 12.3262939453125, 12.762939453125, 13.1995849609375, 13.63623046875, 14.0728759765625, 14.509521484375, 14.9461669921875, 15.3828125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 0.0, 6.0, 4.0, 8.0, 9.0, 13.0, 13.0, 25.0, 32.0, 40.0, 32.0, 54.0, 77.0, 102.0, 219.0, 481.0, 1403.0, 9895.0, 2662709.0, 462585.0, 5783.0, 1150.0, 417.0, 209.0, 111.0, 80.0, 54.0, 36.0, 30.0, 34.0, 18.0, 13.0, 18.0, 15.0, 8.0, 3.0, 10.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.640625, -23.9345703125, -23.228515625, -22.5224609375, -21.81640625, -21.1103515625, -20.404296875, -19.6982421875, -18.9921875, -18.2861328125, -17.580078125, -16.8740234375, -16.16796875, -15.4619140625, -14.755859375, -14.0498046875, -13.34375, -12.6376953125, -11.931640625, -11.2255859375, -10.51953125, -9.8134765625, -9.107421875, -8.4013671875, -7.6953125, -6.9892578125, -6.283203125, -5.5771484375, -4.87109375, -4.1650390625, -3.458984375, -2.7529296875, -2.046875, -1.3408203125, -0.634765625, 0.0712890625, 0.77734375, 1.4833984375, 2.189453125, 2.8955078125, 3.6015625, 4.3076171875, 5.013671875, 5.7197265625, 6.42578125, 7.1318359375, 7.837890625, 8.5439453125, 9.25, 9.9560546875, 10.662109375, 11.3681640625, 12.07421875, 12.7802734375, 13.486328125, 14.1923828125, 14.8984375, 15.6044921875, 16.310546875, 17.0166015625, 17.72265625, 18.4287109375, 19.134765625, 19.8408203125, 20.546875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 77.0, 932.0, 9.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.892574310302734, -7.472862243652344, -2.053150177001953, 3.3665618896484375, 8.786273956298828, 14.205986022949219, 19.62569808959961, 25.04541015625, 30.46512222290039, 35.88483428955078, 41.30454635620117, 46.72425842285156, 52.14397048950195, 57.563682556152344, 62.983394622802734, 68.40310668945312, 73.82281494140625, 79.24252319335938, 84.66223907470703, 90.08195495605469, 95.50166320800781, 100.92137145996094, 106.3410873413086, 111.76080322265625, 117.18051147460938, 122.6002197265625, 128.01992797851562, 133.4396514892578, 138.85935974121094, 144.27906799316406, 149.69879150390625, 155.11849975585938, 160.5382080078125, 165.95791625976562, 171.37762451171875, 176.79734802246094, 182.21705627441406, 187.6367645263672, 193.05648803710938, 198.4761962890625, 203.89590454101562, 209.31561279296875, 214.73532104492188, 220.15504455566406, 225.5747528076172, 230.9944610595703, 236.4141845703125, 241.83389282226562, 247.25360107421875, 252.67330932617188, 258.093017578125, 263.5127258300781, 268.93243408203125, 274.3521728515625, 279.7718811035156, 285.19158935546875, 290.6112976074219, 296.031005859375, 301.4507141113281, 306.87042236328125, 312.2901611328125, 317.7098693847656, 323.12957763671875, 328.5492858886719, 333.968994140625]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 4.0, 4.0, 5.0, 12.0, 11.0, 12.0, 20.0, 16.0, 22.0, 24.0, 31.0, 28.0, 26.0, 31.0, 34.0, 39.0, 44.0, 44.0, 41.0, 39.0, 63.0, 33.0, 39.0, 47.0, 37.0, 25.0, 36.0, 20.0, 27.0, 26.0, 28.0, 23.0, 21.0, 23.0, 11.0, 17.0, 8.0, 4.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-43.85280227661133, -42.60800552368164, -41.36321258544922, -40.11841583251953, -38.87362289428711, -37.62882614135742, -36.384033203125, -35.13923645019531, -33.894439697265625, -32.64964294433594, -31.404850006103516, -30.160053253173828, -28.915258407592773, -27.67046356201172, -26.425668716430664, -25.18087387084961, -23.936079025268555, -22.6912841796875, -21.446489334106445, -20.20169448852539, -18.956897735595703, -17.71210289001465, -16.467308044433594, -15.222512245178223, -13.977717399597168, -12.732922554016113, -11.488126754760742, -10.243331909179688, -8.998537063598633, -7.753741264343262, -6.508946418762207, -5.264150619506836, -4.019355773925781, -2.7745604515075684, -1.5297653675079346, -0.2849702835083008, 0.9598250389099121, 2.204620361328125, 3.4494152069091797, 4.694211006164551, 5.9390058517456055, 7.183801174163818, 8.428596496582031, 9.673391342163086, 10.91818618774414, 12.162981986999512, 13.407776832580566, 14.652572631835938, 15.897367477416992, 17.142162322998047, 18.3869571685791, 19.631752014160156, 20.876548767089844, 22.1213436126709, 23.366138458251953, 24.61093521118164, 25.855728149414062, 27.100522994995117, 28.345317840576172, 29.59011459350586, 30.834909439086914, 32.07970428466797, 33.324501037597656, 34.56929397583008, 35.814090728759766]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 5.0, 6.0, 4.0, 6.0, 8.0, 13.0, 8.0, 14.0, 19.0, 13.0, 26.0, 31.0, 28.0, 26.0, 31.0, 25.0, 35.0, 40.0, 31.0, 53.0, 43.0, 44.0, 49.0, 45.0, 46.0, 33.0, 40.0, 30.0, 34.0, 28.0, 28.0, 26.0, 28.0, 23.0, 17.0, 20.0, 12.0, 5.0, 7.0, 12.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.25836181640625, -4.1417236328125, -4.02508544921875, -3.908447265625, -3.79180908203125, -3.6751708984375, -3.55853271484375, -3.44189453125, -3.32525634765625, -3.2086181640625, -3.09197998046875, -2.975341796875, -2.85870361328125, -2.7420654296875, -2.62542724609375, -2.5087890625, -2.39215087890625, -2.2755126953125, -2.15887451171875, -2.042236328125, -1.92559814453125, -1.8089599609375, -1.69232177734375, -1.57568359375, -1.45904541015625, -1.3424072265625, -1.22576904296875, -1.109130859375, -0.99249267578125, -0.8758544921875, -0.75921630859375, -0.642578125, -0.52593994140625, -0.4093017578125, -0.29266357421875, -0.176025390625, -0.05938720703125, 0.0572509765625, 0.17388916015625, 0.29052734375, 0.40716552734375, 0.5238037109375, 0.64044189453125, 0.757080078125, 0.87371826171875, 0.9903564453125, 1.10699462890625, 1.2236328125, 1.34027099609375, 1.4569091796875, 1.57354736328125, 1.690185546875, 1.80682373046875, 1.9234619140625, 2.04010009765625, 2.15673828125, 2.27337646484375, 2.3900146484375, 2.50665283203125, 2.623291015625, 2.73992919921875, 2.8565673828125, 2.97320556640625, 3.08984375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 5.0, 6.0, 9.0, 9.0, 14.0, 19.0, 24.0, 29.0, 48.0, 57.0, 92.0, 188.0, 310.0, 656.0, 1799.0, 6148.0, 24191.0, 118035.0, 845851.0, 2346026.0, 715651.0, 105228.0, 21384.0, 5510.0, 1644.0, 609.0, 291.0, 143.0, 94.0, 52.0, 33.0, 27.0, 31.0, 14.0, 13.0, 7.0, 10.0, 10.0, 8.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-9.8515625, -9.59539794921875, -9.3392333984375, -9.08306884765625, -8.826904296875, -8.57073974609375, -8.3145751953125, -8.05841064453125, -7.80224609375, -7.54608154296875, -7.2899169921875, -7.03375244140625, -6.777587890625, -6.52142333984375, -6.2652587890625, -6.00909423828125, -5.7529296875, -5.49676513671875, -5.2406005859375, -4.98443603515625, -4.728271484375, -4.47210693359375, -4.2159423828125, -3.95977783203125, -3.70361328125, -3.44744873046875, -3.1912841796875, -2.93511962890625, -2.678955078125, -2.42279052734375, -2.1666259765625, -1.91046142578125, -1.654296875, -1.39813232421875, -1.1419677734375, -0.88580322265625, -0.629638671875, -0.37347412109375, -0.1173095703125, 0.13885498046875, 0.39501953125, 0.65118408203125, 0.9073486328125, 1.16351318359375, 1.419677734375, 1.67584228515625, 1.9320068359375, 2.18817138671875, 2.4443359375, 2.70050048828125, 2.9566650390625, 3.21282958984375, 3.468994140625, 3.72515869140625, 3.9813232421875, 4.23748779296875, 4.49365234375, 4.74981689453125, 5.0059814453125, 5.26214599609375, 5.518310546875, 5.77447509765625, 6.0306396484375, 6.28680419921875, 6.54296875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 6.0, 4.0, 12.0, 22.0, 32.0, 28.0, 38.0, 81.0, 99.0, 165.0, 197.0, 303.0, 347.0, 432.0, 518.0, 483.0, 343.0, 264.0, 208.0, 137.0, 101.0, 82.0, 54.0, 39.0, 13.0, 18.0, 16.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.890625, -11.511962890625, -11.13330078125, -10.754638671875, -10.3759765625, -9.997314453125, -9.61865234375, -9.239990234375, -8.861328125, -8.482666015625, -8.10400390625, -7.725341796875, -7.3466796875, -6.968017578125, -6.58935546875, -6.210693359375, -5.83203125, -5.453369140625, -5.07470703125, -4.696044921875, -4.3173828125, -3.938720703125, -3.56005859375, -3.181396484375, -2.802734375, -2.424072265625, -2.04541015625, -1.666748046875, -1.2880859375, -0.909423828125, -0.53076171875, -0.152099609375, 0.2265625, 0.605224609375, 0.98388671875, 1.362548828125, 1.7412109375, 2.119873046875, 2.49853515625, 2.877197265625, 3.255859375, 3.634521484375, 4.01318359375, 4.391845703125, 4.7705078125, 5.149169921875, 5.52783203125, 5.906494140625, 6.28515625, 6.663818359375, 7.04248046875, 7.421142578125, 7.7998046875, 8.178466796875, 8.55712890625, 8.935791015625, 9.314453125, 9.693115234375, 10.07177734375, 10.450439453125, 10.8291015625, 11.207763671875, 11.58642578125, 11.965087890625, 12.34375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 9.0, 12.0, 10.0, 16.0, 27.0, 35.0, 41.0, 66.0, 118.0, 215.0, 438.0, 1467.0, 17892.0, 3077717.0, 1085786.0, 8502.0, 1066.0, 360.0, 189.0, 88.0, 75.0, 43.0, 41.0, 20.0, 15.0, 7.0, 7.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.875, -35.50390625, -34.1328125, -32.76171875, -31.390625, -30.01953125, -28.6484375, -27.27734375, -25.90625, -24.53515625, -23.1640625, -21.79296875, -20.421875, -19.05078125, -17.6796875, -16.30859375, -14.9375, -13.56640625, -12.1953125, -10.82421875, -9.453125, -8.08203125, -6.7109375, -5.33984375, -3.96875, -2.59765625, -1.2265625, 0.14453125, 1.515625, 2.88671875, 4.2578125, 5.62890625, 7.0, 8.37109375, 9.7421875, 11.11328125, 12.484375, 13.85546875, 15.2265625, 16.59765625, 17.96875, 19.33984375, 20.7109375, 22.08203125, 23.453125, 24.82421875, 26.1953125, 27.56640625, 28.9375, 30.30859375, 31.6796875, 33.05078125, 34.421875, 35.79296875, 37.1640625, 38.53515625, 39.90625, 41.27734375, 42.6484375, 44.01953125, 45.390625, 46.76171875, 48.1328125, 49.50390625, 50.875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 11.0, 54.0, 133.0, 294.0, 305.0, 150.0, 54.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-218.33181762695312, -214.36318969726562, -210.39456176757812, -206.4259490966797, -202.4573211669922, -198.4886932373047, -194.5200653076172, -190.55145263671875, -186.58282470703125, -182.61419677734375, -178.64556884765625, -174.6769561767578, -170.7083282470703, -166.7397003173828, -162.7710723876953, -158.80245971679688, -154.83383178710938, -150.86520385742188, -146.89657592773438, -142.92796325683594, -138.95933532714844, -134.99070739746094, -131.02207946777344, -127.05345916748047, -123.08483123779297, -119.11620330810547, -115.1475830078125, -111.178955078125, -107.21033477783203, -103.24170684814453, -99.27308654785156, -95.30445861816406, -91.33583068847656, -87.36720275878906, -83.3985824584961, -79.4299545288086, -75.46133422851562, -71.49270629882812, -67.52408599853516, -63.555458068847656, -59.58683776855469, -55.61821365356445, -51.64958953857422, -47.680965423583984, -43.71234130859375, -39.74371337890625, -35.77509307861328, -31.806467056274414, -27.837844848632812, -23.869220733642578, -19.900596618652344, -15.931971549987793, -11.963347434997559, -7.994722366333008, -4.026098251342773, -0.05747413635253906, 3.9111499786376953, 7.87977409362793, 11.848398208618164, 15.817023277282715, 19.785648345947266, 23.7542724609375, 27.722896575927734, 31.69152069091797, 35.6601448059082]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 12.0, 8.0, 12.0, 7.0, 13.0, 25.0, 17.0, 13.0, 15.0, 17.0, 21.0, 22.0, 35.0, 29.0, 34.0, 34.0, 24.0, 39.0, 27.0, 46.0, 39.0, 38.0, 38.0, 33.0, 31.0, 33.0, 34.0, 26.0, 28.0, 33.0, 21.0, 32.0, 24.0, 19.0, 16.0, 20.0, 18.0, 12.0, 10.0, 8.0, 6.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-34.68035125732422, -33.65359878540039, -32.62684631347656, -31.600093841552734, -30.57334327697754, -29.54659080505371, -28.519838333129883, -27.493085861206055, -26.46633529663086, -25.43958282470703, -24.412830352783203, -23.386077880859375, -22.35932731628418, -21.33257484436035, -20.305822372436523, -19.279069900512695, -18.252317428588867, -17.22556495666504, -16.19881248474121, -15.1720609664917, -14.145309448242188, -13.11855697631836, -12.091804504394531, -11.065052032470703, -10.038300514221191, -9.011548042297363, -7.984796524047852, -6.958044052124023, -5.9312920570373535, -4.904540061950684, -3.8777875900268555, -2.8510355949401855, -1.8242835998535156, -0.7975314855575562, 0.22922062873840332, 1.2559728622436523, 2.2827248573303223, 3.309476852416992, 4.33622932434082, 5.36298131942749, 6.38973331451416, 7.41648530960083, 8.4432373046875, 9.469989776611328, 10.496742248535156, 11.523493766784668, 12.550246238708496, 13.576997756958008, 14.603750228881836, 15.630502700805664, 16.657255172729492, 17.684005737304688, 18.710758209228516, 19.737510681152344, 20.764263153076172, 21.791015625, 22.817768096923828, 23.844520568847656, 24.871273040771484, 25.898025512695312, 26.924776077270508, 27.951528549194336, 28.978281021118164, 30.005033493041992, 31.031784057617188]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 1.0, 6.0, 2.0, 2.0, 3.0, 11.0, 7.0, 11.0, 17.0, 21.0, 13.0, 19.0, 35.0, 28.0, 15.0, 31.0, 43.0, 39.0, 41.0, 48.0, 46.0, 41.0, 49.0, 46.0, 52.0, 31.0, 41.0, 38.0, 33.0, 39.0, 32.0, 28.0, 20.0, 25.0, 23.0, 19.0, 14.0, 11.0, 4.0, 7.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.734375, -4.6068115234375, -4.479248046875, -4.3516845703125, -4.22412109375, -4.0965576171875, -3.968994140625, -3.8414306640625, -3.7138671875, -3.5863037109375, -3.458740234375, -3.3311767578125, -3.20361328125, -3.0760498046875, -2.948486328125, -2.8209228515625, -2.693359375, -2.5657958984375, -2.438232421875, -2.3106689453125, -2.18310546875, -2.0555419921875, -1.927978515625, -1.8004150390625, -1.6728515625, -1.5452880859375, -1.417724609375, -1.2901611328125, -1.16259765625, -1.0350341796875, -0.907470703125, -0.7799072265625, -0.65234375, -0.5247802734375, -0.397216796875, -0.2696533203125, -0.14208984375, -0.0145263671875, 0.113037109375, 0.2406005859375, 0.3681640625, 0.4957275390625, 0.623291015625, 0.7508544921875, 0.87841796875, 1.0059814453125, 1.133544921875, 1.2611083984375, 1.388671875, 1.5162353515625, 1.643798828125, 1.7713623046875, 1.89892578125, 2.0264892578125, 2.154052734375, 2.2816162109375, 2.4091796875, 2.5367431640625, 2.664306640625, 2.7918701171875, 2.91943359375, 3.0469970703125, 3.174560546875, 3.3021240234375, 3.4296875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 10.0, 20.0, 19.0, 29.0, 53.0, 50.0, 105.0, 162.0, 225.0, 373.0, 530.0, 776.0, 1176.0, 1802.0, 2630.0, 4127.0, 6425.0, 9639.0, 15333.0, 24459.0, 40418.0, 67592.0, 111361.0, 172249.0, 199800.0, 149279.0, 92860.0, 55522.0, 33646.0, 20846.0, 13059.0, 8323.0, 5360.0, 3442.0, 2306.0, 1493.0, 1034.0, 643.0, 435.0, 292.0, 211.0, 141.0, 113.0, 66.0, 41.0, 27.0, 15.0, 20.0, 9.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.398681640625, -0.38634490966796875, -0.3740081787109375, -0.36167144775390625, -0.349334716796875, -0.33699798583984375, -0.3246612548828125, -0.31232452392578125, -0.29998779296875, -0.28765106201171875, -0.2753143310546875, -0.26297760009765625, -0.250640869140625, -0.23830413818359375, -0.2259674072265625, -0.21363067626953125, -0.2012939453125, -0.18895721435546875, -0.1766204833984375, -0.16428375244140625, -0.151947021484375, -0.13961029052734375, -0.1272735595703125, -0.11493682861328125, -0.10260009765625, -0.09026336669921875, -0.0779266357421875, -0.06558990478515625, -0.053253173828125, -0.04091644287109375, -0.0285797119140625, -0.01624298095703125, -0.00390625, 0.00843048095703125, 0.0207672119140625, 0.03310394287109375, 0.045440673828125, 0.05777740478515625, 0.0701141357421875, 0.08245086669921875, 0.09478759765625, 0.10712432861328125, 0.1194610595703125, 0.13179779052734375, 0.144134521484375, 0.15647125244140625, 0.1688079833984375, 0.18114471435546875, 0.1934814453125, 0.20581817626953125, 0.2181549072265625, 0.23049163818359375, 0.242828369140625, 0.25516510009765625, 0.2675018310546875, 0.27983856201171875, 0.29217529296875, 0.30451202392578125, 0.3168487548828125, 0.32918548583984375, 0.341522216796875, 0.35385894775390625, 0.3661956787109375, 0.37853240966796875, 0.390869140625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 9.0, 8.0, 10.0, 5.0, 11.0, 13.0, 19.0, 23.0, 19.0, 21.0, 29.0, 26.0, 21.0, 36.0, 37.0, 32.0, 31.0, 36.0, 27.0, 52.0, 1071.0, 39.0, 25.0, 39.0, 44.0, 38.0, 36.0, 22.0, 26.0, 24.0, 28.0, 23.0, 29.0, 14.0, 16.0, 11.0, 13.0, 10.0, 11.0, 11.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.31640625, -2.246856689453125, -2.17730712890625, -2.107757568359375, -2.0382080078125, -1.968658447265625, -1.89910888671875, -1.829559326171875, -1.760009765625, -1.690460205078125, -1.62091064453125, -1.551361083984375, -1.4818115234375, -1.412261962890625, -1.34271240234375, -1.273162841796875, -1.20361328125, -1.134063720703125, -1.06451416015625, -0.994964599609375, -0.9254150390625, -0.855865478515625, -0.78631591796875, -0.716766357421875, -0.647216796875, -0.577667236328125, -0.50811767578125, -0.438568115234375, -0.3690185546875, -0.299468994140625, -0.22991943359375, -0.160369873046875, -0.0908203125, -0.021270751953125, 0.04827880859375, 0.117828369140625, 0.1873779296875, 0.256927490234375, 0.32647705078125, 0.396026611328125, 0.465576171875, 0.535125732421875, 0.60467529296875, 0.674224853515625, 0.7437744140625, 0.813323974609375, 0.88287353515625, 0.952423095703125, 1.02197265625, 1.091522216796875, 1.16107177734375, 1.230621337890625, 1.3001708984375, 1.369720458984375, 1.43927001953125, 1.508819580078125, 1.578369140625, 1.647918701171875, 1.71746826171875, 1.787017822265625, 1.8565673828125, 1.926116943359375, 1.99566650390625, 2.065216064453125, 2.134765625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 0.0, 2.0, 8.0, 6.0, 9.0, 9.0, 11.0, 36.0, 44.0, 70.0, 89.0, 154.0, 216.0, 313.0, 426.0, 684.0, 1119.0, 1605.0, 2515.0, 3747.0, 5775.0, 9153.0, 13909.0, 21791.0, 33936.0, 53403.0, 83035.0, 122401.0, 184683.0, 1184701.0, 128063.0, 87529.0, 56515.0, 36103.0, 22957.0, 14693.0, 9391.0, 6238.0, 3999.0, 2666.0, 1728.0, 1116.0, 758.0, 522.0, 297.0, 241.0, 154.0, 100.0, 65.0, 57.0, 40.0, 25.0, 11.0, 9.0, 2.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.265869140625, -0.25757598876953125, -0.2492828369140625, -0.24098968505859375, -0.232696533203125, -0.22440338134765625, -0.2161102294921875, -0.20781707763671875, -0.19952392578125, -0.19123077392578125, -0.1829376220703125, -0.17464447021484375, -0.166351318359375, -0.15805816650390625, -0.1497650146484375, -0.14147186279296875, -0.1331787109375, -0.12488555908203125, -0.1165924072265625, -0.10829925537109375, -0.100006103515625, -0.09171295166015625, -0.0834197998046875, -0.07512664794921875, -0.06683349609375, -0.05854034423828125, -0.0502471923828125, -0.04195404052734375, -0.033660888671875, -0.02536773681640625, -0.0170745849609375, -0.00878143310546875, -0.00048828125, 0.00780487060546875, 0.0160980224609375, 0.02439117431640625, 0.032684326171875, 0.04097747802734375, 0.0492706298828125, 0.05756378173828125, 0.06585693359375, 0.07415008544921875, 0.0824432373046875, 0.09073638916015625, 0.099029541015625, 0.10732269287109375, 0.1156158447265625, 0.12390899658203125, 0.1322021484375, 0.14049530029296875, 0.1487884521484375, 0.15708160400390625, 0.165374755859375, 0.17366790771484375, 0.1819610595703125, 0.19025421142578125, 0.19854736328125, 0.20684051513671875, 0.2151336669921875, 0.22342681884765625, 0.231719970703125, 0.24001312255859375, 0.2483062744140625, 0.25659942626953125, 0.264892578125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 10.0, 7.0, 15.0, 17.0, 22.0, 28.0, 24.0, 34.0, 48.0, 31.0, 40.0, 54.0, 52.0, 66.0, 69.0, 55.0, 65.0, 55.0, 50.0, 37.0, 31.0, 25.0, 38.0, 11.0, 19.0, 17.0, 12.0, 10.0, 5.0, 8.0, 9.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0010013580322265625, -0.0009725242853164673, -0.0009436905384063721, -0.0009148567914962769, -0.0008860230445861816, -0.0008571892976760864, -0.0008283555507659912, -0.000799521803855896, -0.0007706880569458008, -0.0007418543100357056, -0.0007130205631256104, -0.0006841868162155151, -0.0006553530693054199, -0.0006265193223953247, -0.0005976855754852295, -0.0005688518285751343, -0.0005400180816650391, -0.0005111843347549438, -0.00048235058784484863, -0.0004535168409347534, -0.0004246830940246582, -0.000395849347114563, -0.0003670156002044678, -0.00033818185329437256, -0.00030934810638427734, -0.00028051435947418213, -0.0002516806125640869, -0.0002228468656539917, -0.00019401311874389648, -0.00016517937183380127, -0.00013634562492370605, -0.00010751187801361084, -7.867813110351562e-05, -4.984438419342041e-05, -2.1010637283325195e-05, 7.82310962677002e-06, 3.6656856536865234e-05, 6.549060344696045e-05, 9.432435035705566e-05, 0.00012315809726715088, 0.0001519918441772461, 0.0001808255910873413, 0.00020965933799743652, 0.00023849308490753174, 0.00026732683181762695, 0.00029616057872772217, 0.0003249943256378174, 0.0003538280725479126, 0.0003826618194580078, 0.00041149556636810303, 0.00044032931327819824, 0.00046916306018829346, 0.0004979968070983887, 0.0005268305540084839, 0.0005556643009185791, 0.0005844980478286743, 0.0006133317947387695, 0.0006421655416488647, 0.00067099928855896, 0.0006998330354690552, 0.0007286667823791504, 0.0007575005292892456, 0.0007863342761993408, 0.000815168023109436, 0.0008440017700195312]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 10.0, 7.0, 11.0, 13.0, 22.0, 21.0, 31.0, 30.0, 39.0, 55.0, 63.0, 103.0, 157.0, 195.0, 305.0, 570.0, 3645.0, 470272.0, 567181.0, 4188.0, 607.0, 318.0, 182.0, 122.0, 86.0, 81.0, 57.0, 48.0, 31.0, 19.0, 16.0, 13.0, 13.0, 11.0, 8.0, 3.0, 7.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016571044921875, -0.016019105911254883, -0.015467166900634766, -0.014915227890014648, -0.014363288879394531, -0.013811349868774414, -0.013259410858154297, -0.01270747184753418, -0.012155532836914062, -0.011603593826293945, -0.011051654815673828, -0.010499715805053711, -0.009947776794433594, -0.009395837783813477, -0.00884389877319336, -0.008291959762573242, -0.007740020751953125, -0.007188081741333008, -0.006636142730712891, -0.0060842037200927734, -0.005532264709472656, -0.004980325698852539, -0.004428386688232422, -0.0038764476776123047, -0.0033245086669921875, -0.0027725696563720703, -0.002220630645751953, -0.001668691635131836, -0.0011167526245117188, -0.0005648136138916016, -1.2874603271484375e-05, 0.0005390644073486328, 0.00109100341796875, 0.0016429424285888672, 0.0021948814392089844, 0.0027468204498291016, 0.0032987594604492188, 0.003850698471069336, 0.004402637481689453, 0.00495457649230957, 0.0055065155029296875, 0.006058454513549805, 0.006610393524169922, 0.007162332534790039, 0.007714271545410156, 0.008266210556030273, 0.00881814956665039, 0.009370088577270508, 0.009922027587890625, 0.010473966598510742, 0.01102590560913086, 0.011577844619750977, 0.012129783630371094, 0.012681722640991211, 0.013233661651611328, 0.013785600662231445, 0.014337539672851562, 0.01488947868347168, 0.015441417694091797, 0.015993356704711914, 0.01654529571533203, 0.01709723472595215, 0.017649173736572266, 0.018201112747192383, 0.0187530517578125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 41.0, 444.0, 486.0, 44.0], "bins": [-0.009929399937391281, -0.009769328869879246, -0.00960925780236721, -0.009449186734855175, -0.00928911566734314, -0.009129044599831104, -0.008968973532319069, -0.008808901533484459, -0.008648830465972424, -0.008488759398460388, -0.008328688330948353, -0.008168617263436317, -0.008008546195924282, -0.007848475128412247, -0.007688403595238924, -0.007528332527726889, -0.007368261925876141, -0.007208190858364105, -0.00704811979085207, -0.0068880487233400345, -0.006727977190166712, -0.0065679061226546764, -0.006407835055142641, -0.006247763987630606, -0.006087692454457283, -0.005927621386945248, -0.005767550319433212, -0.005607479251921177, -0.005447407718747854, -0.005287336651235819, -0.0051272655837237835, -0.004967194516211748, -0.004807123448699713, -0.004647052381187677, -0.004486981313675642, -0.004326909780502319, -0.004166838712990284, -0.004006767645478249, -0.0038466965779662132, -0.003686625510454178, -0.0035265544429421425, -0.003366483375430107, -0.003206412075087428, -0.0030463410075753927, -0.0028862699400633574, -0.0027261986397206783, -0.002566127572208643, -0.0024060565046966076, -0.0022459852043539286, -0.002085914136841893, -0.001925842952914536, -0.0017657717689871788, -0.0016057007014751434, -0.0014456295175477862, -0.001285558333620429, -0.0011254872661083937, -0.0009654160821810365, -0.0008053449564613402, -0.0006452738307416439, -0.0004852026468142867, -0.0003251315210945904, -0.00016506039537489414, -4.989211447536945e-06, 0.00015508185606449842, 0.0003151530399918556]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 5.0, 6.0, 4.0, 18.0, 14.0, 15.0, 13.0, 23.0, 20.0, 19.0, 25.0, 33.0, 24.0, 40.0, 29.0, 50.0, 47.0, 42.0, 42.0, 45.0, 50.0, 35.0, 50.0, 36.0, 33.0, 29.0, 36.0, 33.0, 31.0, 30.0, 20.0, 17.0, 20.0, 14.0, 12.0, 6.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041961669921875, -0.0004038959741592407, -0.00038817524909973145, -0.00037245452404022217, -0.0003567337989807129, -0.0003410130739212036, -0.00032529234886169434, -0.00030957162380218506, -0.0002938508987426758, -0.0002781301736831665, -0.0002624094486236572, -0.00024668872356414795, -0.00023096799850463867, -0.0002152472734451294, -0.00019952654838562012, -0.00018380582332611084, -0.00016808509826660156, -0.00015236437320709229, -0.000136643648147583, -0.00012092292308807373, -0.00010520219802856445, -8.948147296905518e-05, -7.37607479095459e-05, -5.804002285003662e-05, -4.2319297790527344e-05, -2.6598572731018066e-05, -1.0877847671508789e-05, 4.842877388000488e-06, 2.0563602447509766e-05, 3.628432750701904e-05, 5.200505256652832e-05, 6.77257776260376e-05, 8.344650268554688e-05, 9.916722774505615e-05, 0.00011488795280456543, 0.0001306086778640747, 0.00014632940292358398, 0.00016205012798309326, 0.00017777085304260254, 0.00019349157810211182, 0.0002092123031616211, 0.00022493302822113037, 0.00024065375328063965, 0.0002563744783401489, 0.0002720952033996582, 0.0002878159284591675, 0.00030353665351867676, 0.00031925737857818604, 0.0003349781036376953, 0.0003506988286972046, 0.00036641955375671387, 0.00038214027881622314, 0.0003978610038757324, 0.0004135817289352417, 0.000429302453994751, 0.00044502317905426025, 0.00046074390411376953, 0.0004764646291732788, 0.0004921853542327881, 0.0005079060792922974, 0.0005236268043518066, 0.0005393475294113159, 0.0005550682544708252, 0.0005707889795303345, 0.0005865097045898438]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 1.0, 6.0, 2.0, 2.0, 3.0, 11.0, 7.0, 11.0, 17.0, 21.0, 13.0, 19.0, 35.0, 28.0, 15.0, 31.0, 43.0, 39.0, 41.0, 48.0, 46.0, 40.0, 50.0, 46.0, 52.0, 31.0, 41.0, 38.0, 33.0, 39.0, 32.0, 28.0, 20.0, 25.0, 23.0, 19.0, 14.0, 11.0, 4.0, 7.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.734375, -4.6068115234375, -4.479248046875, -4.3516845703125, -4.22412109375, -4.0965576171875, -3.968994140625, -3.8414306640625, -3.7138671875, -3.5863037109375, -3.458740234375, -3.3311767578125, -3.20361328125, -3.0760498046875, -2.948486328125, -2.8209228515625, -2.693359375, -2.5657958984375, -2.438232421875, -2.3106689453125, -2.18310546875, -2.0555419921875, -1.927978515625, -1.8004150390625, -1.6728515625, -1.5452880859375, -1.417724609375, -1.2901611328125, -1.16259765625, -1.0350341796875, -0.907470703125, -0.7799072265625, -0.65234375, -0.5247802734375, -0.397216796875, -0.2696533203125, -0.14208984375, -0.0145263671875, 0.113037109375, 0.2406005859375, 0.3681640625, 0.4957275390625, 0.623291015625, 0.7508544921875, 0.87841796875, 1.0059814453125, 1.133544921875, 1.2611083984375, 1.388671875, 1.5162353515625, 1.643798828125, 1.7713623046875, 1.89892578125, 2.0264892578125, 2.154052734375, 2.2816162109375, 2.4091796875, 2.5367431640625, 2.664306640625, 2.7918701171875, 2.91943359375, 3.0469970703125, 3.174560546875, 3.3021240234375, 3.4296875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 8.0, 6.0, 12.0, 17.0, 40.0, 55.0, 80.0, 108.0, 190.0, 281.0, 504.0, 693.0, 1235.0, 2192.0, 3542.0, 6616.0, 13194.0, 29266.0, 77311.0, 219814.0, 383117.0, 190740.0, 67208.0, 26029.0, 11668.0, 6128.0, 3386.0, 1987.0, 1186.0, 681.0, 476.0, 251.0, 181.0, 118.0, 82.0, 49.0, 37.0, 24.0, 12.0, 9.0, 3.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-3.04296875, -2.959442138671875, -2.87591552734375, -2.792388916015625, -2.7088623046875, -2.625335693359375, -2.54180908203125, -2.458282470703125, -2.374755859375, -2.291229248046875, -2.20770263671875, -2.124176025390625, -2.0406494140625, -1.957122802734375, -1.87359619140625, -1.790069580078125, -1.70654296875, -1.623016357421875, -1.53948974609375, -1.455963134765625, -1.3724365234375, -1.288909912109375, -1.20538330078125, -1.121856689453125, -1.038330078125, -0.954803466796875, -0.87127685546875, -0.787750244140625, -0.7042236328125, -0.620697021484375, -0.53717041015625, -0.453643798828125, -0.3701171875, -0.286590576171875, -0.20306396484375, -0.119537353515625, -0.0360107421875, 0.047515869140625, 0.13104248046875, 0.214569091796875, 0.298095703125, 0.381622314453125, 0.46514892578125, 0.548675537109375, 0.6322021484375, 0.715728759765625, 0.79925537109375, 0.882781982421875, 0.96630859375, 1.049835205078125, 1.13336181640625, 1.216888427734375, 1.3004150390625, 1.383941650390625, 1.46746826171875, 1.550994873046875, 1.634521484375, 1.718048095703125, 1.80157470703125, 1.885101318359375, 1.9686279296875, 2.052154541015625, 2.13568115234375, 2.219207763671875, 2.302734375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 1.0, 4.0, 6.0, 7.0, 12.0, 5.0, 17.0, 14.0, 17.0, 21.0, 30.0, 28.0, 40.0, 30.0, 40.0, 39.0, 46.0, 41.0, 70.0, 268.0, 1653.0, 175.0, 74.0, 50.0, 52.0, 44.0, 38.0, 32.0, 32.0, 19.0, 21.0, 23.0, 20.0, 14.0, 12.0, 13.0, 7.0, 7.0, 5.0, 2.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.953125, -13.52197265625, -13.0908203125, -12.65966796875, -12.228515625, -11.79736328125, -11.3662109375, -10.93505859375, -10.50390625, -10.07275390625, -9.6416015625, -9.21044921875, -8.779296875, -8.34814453125, -7.9169921875, -7.48583984375, -7.0546875, -6.62353515625, -6.1923828125, -5.76123046875, -5.330078125, -4.89892578125, -4.4677734375, -4.03662109375, -3.60546875, -3.17431640625, -2.7431640625, -2.31201171875, -1.880859375, -1.44970703125, -1.0185546875, -0.58740234375, -0.15625, 0.27490234375, 0.7060546875, 1.13720703125, 1.568359375, 1.99951171875, 2.4306640625, 2.86181640625, 3.29296875, 3.72412109375, 4.1552734375, 4.58642578125, 5.017578125, 5.44873046875, 5.8798828125, 6.31103515625, 6.7421875, 7.17333984375, 7.6044921875, 8.03564453125, 8.466796875, 8.89794921875, 9.3291015625, 9.76025390625, 10.19140625, 10.62255859375, 11.0537109375, 11.48486328125, 11.916015625, 12.34716796875, 12.7783203125, 13.20947265625, 13.640625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 1.0, 7.0, 10.0, 9.0, 10.0, 21.0, 20.0, 36.0, 29.0, 47.0, 61.0, 93.0, 142.0, 246.0, 519.0, 1580.0, 22637.0, 3076970.0, 39973.0, 1909.0, 565.0, 257.0, 147.0, 91.0, 86.0, 62.0, 42.0, 29.0, 26.0, 13.0, 11.0, 15.0, 6.0, 8.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.78125, -27.971923828125, -27.16259765625, -26.353271484375, -25.5439453125, -24.734619140625, -23.92529296875, -23.115966796875, -22.306640625, -21.497314453125, -20.68798828125, -19.878662109375, -19.0693359375, -18.260009765625, -17.45068359375, -16.641357421875, -15.83203125, -15.022705078125, -14.21337890625, -13.404052734375, -12.5947265625, -11.785400390625, -10.97607421875, -10.166748046875, -9.357421875, -8.548095703125, -7.73876953125, -6.929443359375, -6.1201171875, -5.310791015625, -4.50146484375, -3.692138671875, -2.8828125, -2.073486328125, -1.26416015625, -0.454833984375, 0.3544921875, 1.163818359375, 1.97314453125, 2.782470703125, 3.591796875, 4.401123046875, 5.21044921875, 6.019775390625, 6.8291015625, 7.638427734375, 8.44775390625, 9.257080078125, 10.06640625, 10.875732421875, 11.68505859375, 12.494384765625, 13.3037109375, 14.113037109375, 14.92236328125, 15.731689453125, 16.541015625, 17.350341796875, 18.15966796875, 18.968994140625, 19.7783203125, 20.587646484375, 21.39697265625, 22.206298828125, 23.015625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 14.0, 927.0, 76.0, 0.0, 1.0], "bins": [-343.09576416015625, -337.4305114746094, -331.7652587890625, -326.0999755859375, -320.4347229003906, -314.76947021484375, -309.1042175292969, -303.43896484375, -297.773681640625, -292.1084289550781, -286.44317626953125, -280.77789306640625, -275.1126403808594, -269.4473876953125, -263.7821350097656, -258.11688232421875, -252.45162963867188, -246.786376953125, -241.12110900878906, -235.4558563232422, -229.79058837890625, -224.12533569335938, -218.4600830078125, -212.79483032226562, -207.1295623779297, -201.4643096923828, -195.79904174804688, -190.1337890625, -184.46853637695312, -178.8032684326172, -173.1380157470703, -167.47274780273438, -161.80751037597656, -156.1422576904297, -150.47698974609375, -144.81173706054688, -139.146484375, -133.48121643066406, -127.81596374511719, -122.15070343017578, -116.48544311523438, -110.82018280029297, -105.15492248535156, -99.48966979980469, -93.82440948486328, -88.15914916992188, -82.493896484375, -76.8286361694336, -71.16337585449219, -65.49811553955078, -59.83285903930664, -54.1676025390625, -48.502342224121094, -42.83708190917969, -37.17182540893555, -31.506568908691406, -25.841306686401367, -20.176048278808594, -14.51078987121582, -8.845531463623047, -3.1802730560302734, 2.4849853515625, 8.150243759155273, 13.815500259399414, 19.48076057434082]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 6.0, 19.0, 16.0, 10.0, 12.0, 16.0, 17.0, 15.0, 18.0, 22.0, 16.0, 24.0, 36.0, 40.0, 40.0, 30.0, 45.0, 38.0, 33.0, 39.0, 30.0, 30.0, 49.0, 38.0, 27.0, 34.0, 32.0, 27.0, 18.0, 24.0, 26.0, 29.0, 15.0, 16.0, 13.0, 15.0, 19.0, 14.0, 9.0, 8.0, 7.0, 5.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-38.482540130615234, -37.325347900390625, -36.16815185546875, -35.01095962524414, -33.853763580322266, -32.696571350097656, -31.539377212524414, -30.382183074951172, -29.22498893737793, -28.067794799804688, -26.910600662231445, -25.753406524658203, -24.596214294433594, -23.43901824951172, -22.28182601928711, -21.124631881713867, -19.967437744140625, -18.810243606567383, -17.65304946899414, -16.4958553314209, -15.338662147521973, -14.18146800994873, -13.024274826049805, -11.867080688476562, -10.70988655090332, -9.552692413330078, -8.395498275756836, -7.23830509185791, -6.081110954284668, -4.923916816711426, -3.766723155975342, -2.609529495239258, -1.4523353576660156, -0.29514145851135254, 0.8620524406433105, 2.0192463397979736, 3.1764402389526367, 4.333634376525879, 5.490828037261963, 6.648021697998047, 7.805215835571289, 8.962409973144531, 10.119604110717773, 11.2767972946167, 12.433991432189941, 13.591185569763184, 14.74837875366211, 15.905572891235352, 17.062767028808594, 18.219961166381836, 19.377155303955078, 20.53434944152832, 21.691543579101562, 22.848735809326172, 24.005929946899414, 25.163124084472656, 26.3203182220459, 27.47751235961914, 28.634706497192383, 29.791900634765625, 30.949092864990234, 32.10628890991211, 33.26348114013672, 34.420677185058594, 35.5778694152832]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 6.0, 12.0, 7.0, 14.0, 14.0, 19.0, 19.0, 33.0, 19.0, 26.0, 23.0, 20.0, 40.0, 34.0, 53.0, 53.0, 40.0, 55.0, 40.0, 52.0, 45.0, 29.0, 34.0, 42.0, 37.0, 32.0, 32.0, 27.0, 22.0, 19.0, 22.0, 20.0, 11.0, 10.0, 10.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.75, -4.62127685546875, -4.4925537109375, -4.36383056640625, -4.235107421875, -4.10638427734375, -3.9776611328125, -3.84893798828125, -3.72021484375, -3.59149169921875, -3.4627685546875, -3.33404541015625, -3.205322265625, -3.07659912109375, -2.9478759765625, -2.81915283203125, -2.6904296875, -2.56170654296875, -2.4329833984375, -2.30426025390625, -2.175537109375, -2.04681396484375, -1.9180908203125, -1.78936767578125, -1.66064453125, -1.53192138671875, -1.4031982421875, -1.27447509765625, -1.145751953125, -1.01702880859375, -0.8883056640625, -0.75958251953125, -0.630859375, -0.50213623046875, -0.3734130859375, -0.24468994140625, -0.115966796875, 0.01275634765625, 0.1414794921875, 0.27020263671875, 0.39892578125, 0.52764892578125, 0.6563720703125, 0.78509521484375, 0.913818359375, 1.04254150390625, 1.1712646484375, 1.29998779296875, 1.4287109375, 1.55743408203125, 1.6861572265625, 1.81488037109375, 1.943603515625, 2.07232666015625, 2.2010498046875, 2.32977294921875, 2.45849609375, 2.58721923828125, 2.7159423828125, 2.84466552734375, 2.973388671875, 3.10211181640625, 3.2308349609375, 3.35955810546875, 3.48828125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 4.0, 8.0, 10.0, 9.0, 13.0, 9.0, 22.0, 21.0, 40.0, 49.0, 69.0, 99.0, 201.0, 439.0, 1617.0, 8985.0, 73562.0, 1108855.0, 2709913.0, 261128.0, 24111.0, 3608.0, 770.0, 286.0, 136.0, 88.0, 52.0, 31.0, 25.0, 23.0, 22.0, 19.0, 13.0, 11.0, 9.0, 4.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8125, -14.414794921875, -14.01708984375, -13.619384765625, -13.2216796875, -12.823974609375, -12.42626953125, -12.028564453125, -11.630859375, -11.233154296875, -10.83544921875, -10.437744140625, -10.0400390625, -9.642333984375, -9.24462890625, -8.846923828125, -8.44921875, -8.051513671875, -7.65380859375, -7.256103515625, -6.8583984375, -6.460693359375, -6.06298828125, -5.665283203125, -5.267578125, -4.869873046875, -4.47216796875, -4.074462890625, -3.6767578125, -3.279052734375, -2.88134765625, -2.483642578125, -2.0859375, -1.688232421875, -1.29052734375, -0.892822265625, -0.4951171875, -0.097412109375, 0.30029296875, 0.697998046875, 1.095703125, 1.493408203125, 1.89111328125, 2.288818359375, 2.6865234375, 3.084228515625, 3.48193359375, 3.879638671875, 4.27734375, 4.675048828125, 5.07275390625, 5.470458984375, 5.8681640625, 6.265869140625, 6.66357421875, 7.061279296875, 7.458984375, 7.856689453125, 8.25439453125, 8.652099609375, 9.0498046875, 9.447509765625, 9.84521484375, 10.242919921875, 10.640625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 17.0, 19.0, 33.0, 62.0, 112.0, 120.0, 166.0, 241.0, 343.0, 491.0, 571.0, 515.0, 404.0, 300.0, 202.0, 142.0, 114.0, 74.0, 50.0, 29.0, 21.0, 10.0, 9.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.46875, -16.0213623046875, -15.573974609375, -15.1265869140625, -14.67919921875, -14.2318115234375, -13.784423828125, -13.3370361328125, -12.8896484375, -12.4422607421875, -11.994873046875, -11.5474853515625, -11.10009765625, -10.6527099609375, -10.205322265625, -9.7579345703125, -9.310546875, -8.8631591796875, -8.415771484375, -7.9683837890625, -7.52099609375, -7.0736083984375, -6.626220703125, -6.1788330078125, -5.7314453125, -5.2840576171875, -4.836669921875, -4.3892822265625, -3.94189453125, -3.4945068359375, -3.047119140625, -2.5997314453125, -2.15234375, -1.7049560546875, -1.257568359375, -0.8101806640625, -0.36279296875, 0.0845947265625, 0.531982421875, 0.9793701171875, 1.4267578125, 1.8741455078125, 2.321533203125, 2.7689208984375, 3.21630859375, 3.6636962890625, 4.111083984375, 4.5584716796875, 5.005859375, 5.4532470703125, 5.900634765625, 6.3480224609375, 6.79541015625, 7.2427978515625, 7.690185546875, 8.1375732421875, 8.5849609375, 9.0323486328125, 9.479736328125, 9.9271240234375, 10.37451171875, 10.8218994140625, 11.269287109375, 11.7166748046875, 12.1640625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 8.0, 24.0, 15.0, 25.0, 34.0, 38.0, 65.0, 87.0, 106.0, 183.0, 258.0, 583.0, 1667.0, 14588.0, 607134.0, 3474986.0, 88043.0, 4374.0, 930.0, 399.0, 214.0, 159.0, 81.0, 62.0, 53.0, 45.0, 24.0, 25.0, 13.0, 10.0, 12.0, 8.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.625, -31.58154296875, -30.5380859375, -29.49462890625, -28.451171875, -27.40771484375, -26.3642578125, -25.32080078125, -24.27734375, -23.23388671875, -22.1904296875, -21.14697265625, -20.103515625, -19.06005859375, -18.0166015625, -16.97314453125, -15.9296875, -14.88623046875, -13.8427734375, -12.79931640625, -11.755859375, -10.71240234375, -9.6689453125, -8.62548828125, -7.58203125, -6.53857421875, -5.4951171875, -4.45166015625, -3.408203125, -2.36474609375, -1.3212890625, -0.27783203125, 0.765625, 1.80908203125, 2.8525390625, 3.89599609375, 4.939453125, 5.98291015625, 7.0263671875, 8.06982421875, 9.11328125, 10.15673828125, 11.2001953125, 12.24365234375, 13.287109375, 14.33056640625, 15.3740234375, 16.41748046875, 17.4609375, 18.50439453125, 19.5478515625, 20.59130859375, 21.634765625, 22.67822265625, 23.7216796875, 24.76513671875, 25.80859375, 26.85205078125, 27.8955078125, 28.93896484375, 29.982421875, 31.02587890625, 32.0693359375, 33.11279296875, 34.15625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 11.0, 35.0, 111.0, 181.0, 272.0, 226.0, 115.0, 42.0, 12.0, 10.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.71157455444336, -36.8895263671875, -33.06747817993164, -29.24542999267578, -25.423381805419922, -21.601333618164062, -17.779285430908203, -13.957237243652344, -10.135189056396484, -6.313140869140625, -2.4910926818847656, 1.3309555053710938, 5.153003692626953, 8.975051879882812, 12.797100067138672, 16.61914825439453, 20.44119644165039, 24.26324462890625, 28.08529281616211, 31.90734100341797, 35.72938919067383, 39.55143737792969, 43.37348556518555, 47.195533752441406, 51.017581939697266, 54.839630126953125, 58.661678314208984, 62.483726501464844, 66.30577087402344, 70.12782287597656, 73.94987487792969, 77.77191925048828, 81.59396362304688, 85.416015625, 89.2380599975586, 93.06010437011719, 96.88215637207031, 100.70420837402344, 104.52625274658203, 108.34829711914062, 112.17034912109375, 115.99240112304688, 119.81444549560547, 123.63648986816406, 127.45854187011719, 131.2805938720703, 135.10263061523438, 138.9246826171875, 142.74673461914062, 146.56878662109375, 150.39083862304688, 154.21287536621094, 158.03492736816406, 161.8569793701172, 165.67901611328125, 169.50106811523438, 173.3231201171875, 177.14517211914062, 180.96722412109375, 184.7892608642578, 188.61131286621094, 192.43336486816406, 196.25540161132812, 200.07745361328125, 203.89950561523438]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 7.0, 9.0, 6.0, 14.0, 13.0, 14.0, 19.0, 16.0, 23.0, 24.0, 21.0, 29.0, 34.0, 30.0, 33.0, 27.0, 37.0, 33.0, 30.0, 42.0, 47.0, 48.0, 39.0, 34.0, 34.0, 32.0, 31.0, 36.0, 33.0, 22.0, 25.0, 25.0, 25.0, 14.0, 19.0, 11.0, 11.0, 8.0, 10.0, 6.0, 7.0, 8.0, 1.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.23828125, -29.138547897338867, -28.038814544677734, -26.9390811920166, -25.83934783935547, -24.739614486694336, -23.639881134033203, -22.54014778137207, -21.440414428710938, -20.340681076049805, -19.240947723388672, -18.14121437072754, -17.041481018066406, -15.941747665405273, -14.84201431274414, -13.742280960083008, -12.642547607421875, -11.542814254760742, -10.44308090209961, -9.343347549438477, -8.243614196777344, -7.143880844116211, -6.044147491455078, -4.944414138793945, -3.8446807861328125, -2.7449474334716797, -1.6452140808105469, -0.5454807281494141, 0.5542526245117188, 1.6539859771728516, 2.7537193298339844, 3.853452682495117, 4.95318603515625, 6.052919387817383, 7.152652740478516, 8.252386093139648, 9.352119445800781, 10.451852798461914, 11.551586151123047, 12.65131950378418, 13.751052856445312, 14.850786209106445, 15.950519561767578, 17.05025291442871, 18.149986267089844, 19.249719619750977, 20.34945297241211, 21.449186325073242, 22.548919677734375, 23.648653030395508, 24.74838638305664, 25.848119735717773, 26.947853088378906, 28.04758644104004, 29.147319793701172, 30.247053146362305, 31.346786499023438, 32.44651794433594, 33.5462532043457, 34.64598846435547, 35.74571990966797, 36.84545135498047, 37.945186614990234, 39.044921875, 40.1446533203125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 9.0, 5.0, 2.0, 5.0, 11.0, 12.0, 21.0, 22.0, 24.0, 21.0, 30.0, 29.0, 33.0, 26.0, 21.0, 34.0, 39.0, 45.0, 50.0, 39.0, 41.0, 43.0, 43.0, 45.0, 37.0, 34.0, 29.0, 37.0, 38.0, 20.0, 21.0, 21.0, 18.0, 21.0, 13.0, 14.0, 5.0, 13.0, 7.0, 5.0, 2.0, 6.0, 3.0, 3.0, 3.0], "bins": [-4.859375, -4.734893798828125, -4.61041259765625, -4.485931396484375, -4.3614501953125, -4.236968994140625, -4.11248779296875, -3.988006591796875, -3.863525390625, -3.739044189453125, -3.61456298828125, -3.490081787109375, -3.3656005859375, -3.241119384765625, -3.11663818359375, -2.992156982421875, -2.86767578125, -2.743194580078125, -2.61871337890625, -2.494232177734375, -2.3697509765625, -2.245269775390625, -2.12078857421875, -1.996307373046875, -1.871826171875, -1.747344970703125, -1.62286376953125, -1.498382568359375, -1.3739013671875, -1.249420166015625, -1.12493896484375, -1.000457763671875, -0.8759765625, -0.751495361328125, -0.62701416015625, -0.502532958984375, -0.3780517578125, -0.253570556640625, -0.12908935546875, -0.004608154296875, 0.119873046875, 0.244354248046875, 0.36883544921875, 0.493316650390625, 0.6177978515625, 0.742279052734375, 0.86676025390625, 0.991241455078125, 1.11572265625, 1.240203857421875, 1.36468505859375, 1.489166259765625, 1.6136474609375, 1.738128662109375, 1.86260986328125, 1.987091064453125, 2.111572265625, 2.236053466796875, 2.36053466796875, 2.485015869140625, 2.6094970703125, 2.733978271484375, 2.85845947265625, 2.982940673828125, 3.107421875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 8.0, 7.0, 17.0, 24.0, 34.0, 42.0, 55.0, 97.0, 126.0, 181.0, 259.0, 436.0, 700.0, 964.0, 1486.0, 2193.0, 3566.0, 5240.0, 7883.0, 12394.0, 18870.0, 29960.0, 48103.0, 79242.0, 130807.0, 189554.0, 185644.0, 126514.0, 76409.0, 46147.0, 28569.0, 18474.0, 11921.0, 7697.0, 5079.0, 3394.0, 2172.0, 1447.0, 968.0, 640.0, 412.0, 266.0, 181.0, 135.0, 73.0, 62.0, 39.0, 28.0, 14.0, 8.0, 10.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.40380859375, -0.3907661437988281, -0.37772369384765625, -0.3646812438964844, -0.3516387939453125, -0.3385963439941406, -0.32555389404296875, -0.3125114440917969, -0.299468994140625, -0.2864265441894531, -0.27338409423828125, -0.2603416442871094, -0.2472991943359375, -0.23425674438476562, -0.22121429443359375, -0.20817184448242188, -0.19512939453125, -0.18208694458007812, -0.16904449462890625, -0.15600204467773438, -0.1429595947265625, -0.12991714477539062, -0.11687469482421875, -0.10383224487304688, -0.090789794921875, -0.07774734497070312, -0.06470489501953125, -0.051662445068359375, -0.0386199951171875, -0.025577545166015625, -0.01253509521484375, 0.000507354736328125, 0.0135498046875, 0.026592254638671875, 0.03963470458984375, 0.052677154541015625, 0.0657196044921875, 0.07876205444335938, 0.09180450439453125, 0.10484695434570312, 0.117889404296875, 0.13093185424804688, 0.14397430419921875, 0.15701675415039062, 0.1700592041015625, 0.18310165405273438, 0.19614410400390625, 0.20918655395507812, 0.22222900390625, 0.23527145385742188, 0.24831390380859375, 0.2613563537597656, 0.2743988037109375, 0.2874412536621094, 0.30048370361328125, 0.3135261535644531, 0.326568603515625, 0.3396110534667969, 0.35265350341796875, 0.3656959533691406, 0.3787384033203125, 0.3917808532714844, 0.40482330322265625, 0.4178657531738281, 0.430908203125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 5.0, 8.0, 10.0, 6.0, 8.0, 11.0, 14.0, 24.0, 23.0, 20.0, 28.0, 23.0, 34.0, 19.0, 35.0, 40.0, 37.0, 27.0, 51.0, 35.0, 42.0, 1057.0, 52.0, 43.0, 35.0, 45.0, 45.0, 34.0, 31.0, 17.0, 25.0, 23.0, 24.0, 18.0, 13.0, 8.0, 8.0, 9.0, 8.0, 7.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-2.517578125, -2.441436767578125, -2.36529541015625, -2.289154052734375, -2.2130126953125, -2.136871337890625, -2.06072998046875, -1.984588623046875, -1.908447265625, -1.832305908203125, -1.75616455078125, -1.680023193359375, -1.6038818359375, -1.527740478515625, -1.45159912109375, -1.375457763671875, -1.29931640625, -1.223175048828125, -1.14703369140625, -1.070892333984375, -0.9947509765625, -0.918609619140625, -0.84246826171875, -0.766326904296875, -0.690185546875, -0.614044189453125, -0.53790283203125, -0.461761474609375, -0.3856201171875, -0.309478759765625, -0.23333740234375, -0.157196044921875, -0.0810546875, -0.004913330078125, 0.07122802734375, 0.147369384765625, 0.2235107421875, 0.299652099609375, 0.37579345703125, 0.451934814453125, 0.528076171875, 0.604217529296875, 0.68035888671875, 0.756500244140625, 0.8326416015625, 0.908782958984375, 0.98492431640625, 1.061065673828125, 1.13720703125, 1.213348388671875, 1.28948974609375, 1.365631103515625, 1.4417724609375, 1.517913818359375, 1.59405517578125, 1.670196533203125, 1.746337890625, 1.822479248046875, 1.89862060546875, 1.974761962890625, 2.0509033203125, 2.127044677734375, 2.20318603515625, 2.279327392578125, 2.35546875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 8.0, 13.0, 15.0, 38.0, 39.0, 56.0, 100.0, 165.0, 221.0, 363.0, 573.0, 944.0, 1583.0, 2718.0, 4609.0, 8053.0, 14289.0, 25237.0, 46155.0, 85369.0, 149664.0, 1260436.0, 201090.0, 131265.0, 73158.0, 39574.0, 22006.0, 12400.0, 6987.0, 4121.0, 2335.0, 1389.0, 789.0, 498.0, 343.0, 179.0, 112.0, 85.0, 42.0, 31.0, 19.0, 17.0, 20.0, 9.0, 5.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.35986328125, -0.34781646728515625, -0.3357696533203125, -0.32372283935546875, -0.311676025390625, -0.29962921142578125, -0.2875823974609375, -0.27553558349609375, -0.26348876953125, -0.25144195556640625, -0.2393951416015625, -0.22734832763671875, -0.215301513671875, -0.20325469970703125, -0.1912078857421875, -0.17916107177734375, -0.1671142578125, -0.15506744384765625, -0.1430206298828125, -0.13097381591796875, -0.118927001953125, -0.10688018798828125, -0.0948333740234375, -0.08278656005859375, -0.07073974609375, -0.05869293212890625, -0.0466461181640625, -0.03459930419921875, -0.022552490234375, -0.01050567626953125, 0.0015411376953125, 0.01358795166015625, 0.025634765625, 0.03768157958984375, 0.0497283935546875, 0.06177520751953125, 0.073822021484375, 0.08586883544921875, 0.0979156494140625, 0.10996246337890625, 0.12200927734375, 0.13405609130859375, 0.1461029052734375, 0.15814971923828125, 0.170196533203125, 0.18224334716796875, 0.1942901611328125, 0.20633697509765625, 0.2183837890625, 0.23043060302734375, 0.2424774169921875, 0.25452423095703125, 0.266571044921875, 0.27861785888671875, 0.2906646728515625, 0.30271148681640625, 0.31475830078125, 0.32680511474609375, 0.3388519287109375, 0.35089874267578125, 0.362945556640625, 0.37499237060546875, 0.3870391845703125, 0.39908599853515625, 0.4111328125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 9.0, 10.0, 9.0, 17.0, 26.0, 23.0, 31.0, 28.0, 51.0, 56.0, 62.0, 73.0, 75.0, 56.0, 62.0, 57.0, 44.0, 59.0, 31.0, 43.0, 28.0, 30.0, 24.0, 14.0, 18.0, 16.0, 11.0, 12.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011186599731445312, -0.0010768920183181763, -0.0010351240634918213, -0.0009933561086654663, -0.0009515881538391113, -0.0009098201990127563, -0.0008680522441864014, -0.0008262842893600464, -0.0007845163345336914, -0.0007427483797073364, -0.0007009804248809814, -0.0006592124700546265, -0.0006174445152282715, -0.0005756765604019165, -0.0005339086055755615, -0.0004921406507492065, -0.00045037269592285156, -0.0004086047410964966, -0.0003668367862701416, -0.0003250688314437866, -0.00028330087661743164, -0.00024153292179107666, -0.00019976496696472168, -0.0001579970121383667, -0.00011622905731201172, -7.446110248565674e-05, -3.269314765930176e-05, 9.074807167053223e-06, 5.08427619934082e-05, 9.261071681976318e-05, 0.00013437867164611816, 0.00017614662647247314, 0.00021791458129882812, 0.0002596825361251831, 0.0003014504909515381, 0.00034321844577789307, 0.00038498640060424805, 0.00042675435543060303, 0.000468522310256958, 0.000510290265083313, 0.000552058219909668, 0.000593826174736023, 0.0006355941295623779, 0.0006773620843887329, 0.0007191300392150879, 0.0007608979940414429, 0.0008026659488677979, 0.0008444339036941528, 0.0008862018585205078, 0.0009279698133468628, 0.0009697377681732178, 0.0010115057229995728, 0.0010532736778259277, 0.0010950416326522827, 0.0011368095874786377, 0.0011785775423049927, 0.0012203454971313477, 0.0012621134519577026, 0.0013038814067840576, 0.0013456493616104126, 0.0013874173164367676, 0.0014291852712631226, 0.0014709532260894775, 0.0015127211809158325, 0.0015544891357421875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 4.0, 9.0, 12.0, 10.0, 17.0, 22.0, 35.0, 38.0, 46.0, 81.0, 117.0, 164.0, 313.0, 731.0, 22462.0, 1019491.0, 3724.0, 532.0, 240.0, 159.0, 103.0, 69.0, 43.0, 32.0, 23.0, 18.0, 18.0, 5.0, 8.0, 5.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0282745361328125, -0.02737283706665039, -0.02647113800048828, -0.025569438934326172, -0.024667739868164062, -0.023766040802001953, -0.022864341735839844, -0.021962642669677734, -0.021060943603515625, -0.020159244537353516, -0.019257545471191406, -0.018355846405029297, -0.017454147338867188, -0.016552448272705078, -0.01565074920654297, -0.01474905014038086, -0.01384735107421875, -0.01294565200805664, -0.012043952941894531, -0.011142253875732422, -0.010240554809570312, -0.009338855743408203, -0.008437156677246094, -0.007535457611083984, -0.006633758544921875, -0.005732059478759766, -0.004830360412597656, -0.003928661346435547, -0.0030269622802734375, -0.002125263214111328, -0.0012235641479492188, -0.0003218650817871094, 0.000579833984375, 0.0014815330505371094, 0.0023832321166992188, 0.003284931182861328, 0.0041866302490234375, 0.005088329315185547, 0.005990028381347656, 0.006891727447509766, 0.007793426513671875, 0.008695125579833984, 0.009596824645996094, 0.010498523712158203, 0.011400222778320312, 0.012301921844482422, 0.013203620910644531, 0.01410531997680664, 0.01500701904296875, 0.01590871810913086, 0.01681041717529297, 0.017712116241455078, 0.018613815307617188, 0.019515514373779297, 0.020417213439941406, 0.021318912506103516, 0.022220611572265625, 0.023122310638427734, 0.024024009704589844, 0.024925708770751953, 0.025827407836914062, 0.026729106903076172, 0.02763080596923828, 0.02853250503540039, 0.0294342041015625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 162.0, 854.0], "bins": [-0.027364365756511688, -0.026931503787636757, -0.026498641818761826, -0.026065779849886894, -0.025632917881011963, -0.025200054049491882, -0.02476719208061695, -0.02433433011174202, -0.02390146814286709, -0.023468606173992157, -0.023035744205117226, -0.022602882236242294, -0.022170020267367363, -0.02173715829849243, -0.02130429446697235, -0.02087143249809742, -0.02043857052922249, -0.020005708560347557, -0.019572846591472626, -0.019139984622597694, -0.018707122653722763, -0.018274258822202682, -0.01784139685332775, -0.01740853488445282, -0.01697567291557789, -0.016542810946702957, -0.016109948977828026, -0.015677087008953094, -0.015244224108755589, -0.014811362139880657, -0.014378500171005726, -0.01394563727080822, -0.013512775301933289, -0.013079913333058357, -0.012647051364183426, -0.01221418846398592, -0.011781326495110989, -0.011348464526236057, -0.010915602557361126, -0.01048273965716362, -0.010049878619611263, -0.009617016650736332, -0.0091841546818614, -0.008751291781663895, -0.008318429812788963, -0.007885567843914032, -0.007452705875039101, -0.007019843440502882, -0.006586981005966663, -0.006154119037091732, -0.005721256602555513, -0.005288394633680582, -0.004855532199144363, -0.004422670230269432, -0.003989808261394501, -0.003556945826858282, -0.003124083625152707, -0.002691221423447132, -0.002258359221741557, -0.001825497136451304, -0.001392634934745729, -0.0009597728494554758, -0.0005269106477499008, -9.404844604432583e-05, 0.0003388137847650796]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 3.0, 8.0, 11.0, 16.0, 24.0, 26.0, 19.0, 32.0, 34.0, 55.0, 37.0, 56.0, 42.0, 45.0, 49.0, 58.0, 38.0, 65.0, 53.0, 53.0, 31.0, 42.0, 35.0, 29.0, 23.0, 29.0, 21.0, 14.0, 17.0, 9.0, 7.0, 5.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005638003349304199, -0.0005384916439652443, -0.0005131829530000687, -0.00048787426203489304, -0.0004625655710697174, -0.0004372568801045418, -0.00041194818913936615, -0.0003866394981741905, -0.0003613308072090149, -0.00033602211624383926, -0.00031071342527866364, -0.000285404734313488, -0.0002600960433483124, -0.00023478735238313675, -0.00020947866141796112, -0.0001841699704527855, -0.00015886127948760986, -0.00013355258852243423, -0.0001082438975572586, -8.293520659208298e-05, -5.762651562690735e-05, -3.231782466173172e-05, -7.009133696556091e-06, 1.8299557268619537e-05, 4.3608248233795166e-05, 6.89169391989708e-05, 9.422563016414642e-05, 0.00011953432112932205, 0.00014484301209449768, 0.0001701517030596733, 0.00019546039402484894, 0.00022076908499002457, 0.0002460777759552002, 0.0002713864669203758, 0.00029669515788555145, 0.0003220038488507271, 0.0003473125398159027, 0.00037262123078107834, 0.00039792992174625397, 0.0004232386127114296, 0.0004485473036766052, 0.00047385599464178085, 0.0004991646856069565, 0.0005244733765721321, 0.0005497820675373077, 0.0005750907585024834, 0.000600399449467659, 0.0006257081404328346, 0.0006510168313980103, 0.0006763255223631859, 0.0007016342133283615, 0.0007269429042935371, 0.0007522515952587128, 0.0007775602862238884, 0.000802868977189064, 0.0008281776681542397, 0.0008534863591194153, 0.0008787950500845909, 0.0009041037410497665, 0.0009294124320149422, 0.0009547211229801178, 0.0009800298139452934, 0.001005338504910469, 0.0010306471958756447, 0.0010559558868408203]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 9.0, 5.0, 2.0, 5.0, 11.0, 12.0, 21.0, 23.0, 23.0, 21.0, 30.0, 29.0, 33.0, 26.0, 21.0, 34.0, 39.0, 45.0, 50.0, 39.0, 41.0, 43.0, 43.0, 45.0, 37.0, 34.0, 29.0, 37.0, 38.0, 20.0, 21.0, 21.0, 18.0, 21.0, 13.0, 14.0, 5.0, 13.0, 7.0, 5.0, 2.0, 6.0, 3.0, 3.0, 3.0], "bins": [-4.859375, -4.734893798828125, -4.61041259765625, -4.485931396484375, -4.3614501953125, -4.236968994140625, -4.11248779296875, -3.988006591796875, -3.863525390625, -3.739044189453125, -3.61456298828125, -3.490081787109375, -3.3656005859375, -3.241119384765625, -3.11663818359375, -2.992156982421875, -2.86767578125, -2.743194580078125, -2.61871337890625, -2.494232177734375, -2.3697509765625, -2.245269775390625, -2.12078857421875, -1.996307373046875, -1.871826171875, -1.747344970703125, -1.62286376953125, -1.498382568359375, -1.3739013671875, -1.249420166015625, -1.12493896484375, -1.000457763671875, -0.8759765625, -0.751495361328125, -0.62701416015625, -0.502532958984375, -0.3780517578125, -0.253570556640625, -0.12908935546875, -0.004608154296875, 0.119873046875, 0.244354248046875, 0.36883544921875, 0.493316650390625, 0.6177978515625, 0.742279052734375, 0.86676025390625, 0.991241455078125, 1.11572265625, 1.240203857421875, 1.36468505859375, 1.489166259765625, 1.6136474609375, 1.738128662109375, 1.86260986328125, 1.987091064453125, 2.111572265625, 2.236053466796875, 2.36053466796875, 2.485015869140625, 2.6094970703125, 2.733978271484375, 2.85845947265625, 2.982940673828125, 3.107421875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 20.0, 27.0, 38.0, 52.0, 90.0, 135.0, 181.0, 303.0, 464.0, 690.0, 1112.0, 1639.0, 2829.0, 4329.0, 7318.0, 14322.0, 32804.0, 91854.0, 379489.0, 358623.0, 87578.0, 31636.0, 13922.0, 7313.0, 4348.0, 2597.0, 1685.0, 1081.0, 712.0, 473.0, 306.0, 205.0, 127.0, 77.0, 48.0, 26.0, 33.0, 11.0, 8.0, 8.0, 7.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.666015625, -3.539520263671875, -3.41302490234375, -3.286529541015625, -3.1600341796875, -3.033538818359375, -2.90704345703125, -2.780548095703125, -2.654052734375, -2.527557373046875, -2.40106201171875, -2.274566650390625, -2.1480712890625, -2.021575927734375, -1.89508056640625, -1.768585205078125, -1.64208984375, -1.515594482421875, -1.38909912109375, -1.262603759765625, -1.1361083984375, -1.009613037109375, -0.88311767578125, -0.756622314453125, -0.630126953125, -0.503631591796875, -0.37713623046875, -0.250640869140625, -0.1241455078125, 0.002349853515625, 0.12884521484375, 0.255340576171875, 0.3818359375, 0.508331298828125, 0.63482666015625, 0.761322021484375, 0.8878173828125, 1.014312744140625, 1.14080810546875, 1.267303466796875, 1.393798828125, 1.520294189453125, 1.64678955078125, 1.773284912109375, 1.8997802734375, 2.026275634765625, 2.15277099609375, 2.279266357421875, 2.40576171875, 2.532257080078125, 2.65875244140625, 2.785247802734375, 2.9117431640625, 3.038238525390625, 3.16473388671875, 3.291229248046875, 3.417724609375, 3.544219970703125, 3.67071533203125, 3.797210693359375, 3.9237060546875, 4.050201416015625, 4.17669677734375, 4.303192138671875, 4.4296875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 5.0, 11.0, 9.0, 14.0, 11.0, 9.0, 18.0, 14.0, 21.0, 27.0, 27.0, 34.0, 24.0, 36.0, 37.0, 34.0, 53.0, 59.0, 92.0, 300.0, 1595.0, 127.0, 85.0, 46.0, 48.0, 36.0, 44.0, 34.0, 36.0, 26.0, 22.0, 20.0, 11.0, 15.0, 12.0, 14.0, 6.0, 7.0, 2.0, 1.0, 6.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-14.125, -13.712890625, -13.30078125, -12.888671875, -12.4765625, -12.064453125, -11.65234375, -11.240234375, -10.828125, -10.416015625, -10.00390625, -9.591796875, -9.1796875, -8.767578125, -8.35546875, -7.943359375, -7.53125, -7.119140625, -6.70703125, -6.294921875, -5.8828125, -5.470703125, -5.05859375, -4.646484375, -4.234375, -3.822265625, -3.41015625, -2.998046875, -2.5859375, -2.173828125, -1.76171875, -1.349609375, -0.9375, -0.525390625, -0.11328125, 0.298828125, 0.7109375, 1.123046875, 1.53515625, 1.947265625, 2.359375, 2.771484375, 3.18359375, 3.595703125, 4.0078125, 4.419921875, 4.83203125, 5.244140625, 5.65625, 6.068359375, 6.48046875, 6.892578125, 7.3046875, 7.716796875, 8.12890625, 8.541015625, 8.953125, 9.365234375, 9.77734375, 10.189453125, 10.6015625, 11.013671875, 11.42578125, 11.837890625, 12.25]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 9.0, 3.0, 4.0, 4.0, 7.0, 18.0, 19.0, 26.0, 31.0, 49.0, 82.0, 134.0, 214.0, 345.0, 1069.0, 15103.0, 3053943.0, 71105.0, 2256.0, 477.0, 269.0, 157.0, 112.0, 61.0, 47.0, 35.0, 37.0, 19.0, 20.0, 15.0, 9.0, 7.0, 7.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.40625, -34.32275390625, -33.2392578125, -32.15576171875, -31.072265625, -29.98876953125, -28.9052734375, -27.82177734375, -26.73828125, -25.65478515625, -24.5712890625, -23.48779296875, -22.404296875, -21.32080078125, -20.2373046875, -19.15380859375, -18.0703125, -16.98681640625, -15.9033203125, -14.81982421875, -13.736328125, -12.65283203125, -11.5693359375, -10.48583984375, -9.40234375, -8.31884765625, -7.2353515625, -6.15185546875, -5.068359375, -3.98486328125, -2.9013671875, -1.81787109375, -0.734375, 0.34912109375, 1.4326171875, 2.51611328125, 3.599609375, 4.68310546875, 5.7666015625, 6.85009765625, 7.93359375, 9.01708984375, 10.1005859375, 11.18408203125, 12.267578125, 13.35107421875, 14.4345703125, 15.51806640625, 16.6015625, 17.68505859375, 18.7685546875, 19.85205078125, 20.935546875, 22.01904296875, 23.1025390625, 24.18603515625, 25.26953125, 26.35302734375, 27.4365234375, 28.52001953125, 29.603515625, 30.68701171875, 31.7705078125, 32.85400390625, 33.9375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 7.0, 21.0, 88.0, 232.0, 316.0, 228.0, 94.0, 26.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.308319091796875, -5.9836273193359375, -4.658935546875, -3.3342432975769043, -2.009551525115967, -0.6848597526550293, 0.6398324966430664, 1.964524269104004, 3.2892160415649414, 4.613907814025879, 5.938599586486816, 7.263291835784912, 8.587984085083008, 9.912675857543945, 11.237367630004883, 12.56205940246582, 13.886751174926758, 15.211442947387695, 16.536134719848633, 17.86082649230957, 19.185518264770508, 20.510210037231445, 21.834903717041016, 23.159595489501953, 24.48428726196289, 25.808979034423828, 27.133670806884766, 28.458362579345703, 29.78305435180664, 31.107746124267578, 32.432437896728516, 33.75712966918945, 35.08182144165039, 36.40651321411133, 37.731204986572266, 39.0558967590332, 40.38058853149414, 41.70528030395508, 43.029972076416016, 44.35466384887695, 45.67935562133789, 47.00404739379883, 48.328739166259766, 49.6534309387207, 50.97812271118164, 52.30281448364258, 53.627506256103516, 54.95219802856445, 56.276893615722656, 57.601585388183594, 58.92627716064453, 60.25096893310547, 61.575660705566406, 62.900352478027344, 64.22504425048828, 65.54973602294922, 66.87442779541016, 68.1991195678711, 69.52381134033203, 70.84850311279297, 72.1731948852539, 73.49788665771484, 74.82257843017578, 76.14727020263672, 77.47196197509766]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 2.0, 8.0, 7.0, 18.0, 16.0, 22.0, 19.0, 19.0, 25.0, 27.0, 29.0, 28.0, 19.0, 37.0, 33.0, 37.0, 30.0, 46.0, 34.0, 36.0, 38.0, 45.0, 41.0, 36.0, 34.0, 35.0, 35.0, 33.0, 19.0, 28.0, 29.0, 17.0, 17.0, 16.0, 20.0, 11.0, 14.0, 4.0, 6.0, 8.0, 4.0, 6.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.70394515991211, -34.50711441040039, -33.31028366088867, -32.11345291137695, -30.9166202545166, -29.719789505004883, -28.52295684814453, -27.326126098632812, -26.129295349121094, -24.932464599609375, -23.735633850097656, -22.538801193237305, -21.341970443725586, -20.145139694213867, -18.948307037353516, -17.751476287841797, -16.554645538330078, -15.35781478881836, -14.160983085632324, -12.964151382446289, -11.76732063293457, -10.570489883422852, -9.373658180236816, -8.176826477050781, -6.9799957275390625, -5.7831645011901855, -4.586333274841309, -3.3895020484924316, -2.1926708221435547, -0.9958395957946777, 0.20099163055419922, 1.3978233337402344, 2.5946578979492188, 3.7914891242980957, 4.988320350646973, 6.18515157699585, 7.381982803344727, 8.578813552856445, 9.77564525604248, 10.972476959228516, 12.169307708740234, 13.366138458251953, 14.562970161437988, 15.759801864624023, 16.956632614135742, 18.15346336364746, 19.350296020507812, 20.54712677001953, 21.74395751953125, 22.94078826904297, 24.137619018554688, 25.33445167541504, 26.531282424926758, 27.728113174438477, 28.924945831298828, 30.121776580810547, 31.318607330322266, 32.515438079833984, 33.7122688293457, 34.90909957885742, 36.105934143066406, 37.302764892578125, 38.499595642089844, 39.69642639160156, 40.89325714111328]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 5.0, 3.0, 6.0, 8.0, 12.0, 16.0, 14.0, 19.0, 20.0, 34.0, 27.0, 27.0, 36.0, 38.0, 28.0, 31.0, 43.0, 38.0, 49.0, 54.0, 54.0, 38.0, 40.0, 31.0, 32.0, 41.0, 33.0, 33.0, 30.0, 24.0, 20.0, 26.0, 18.0, 13.0, 12.0, 7.0, 7.0, 7.0, 5.0, 4.0, 6.0, 3.0, 1.0, 4.0], "bins": [-5.26171875, -5.128204345703125, -4.99468994140625, -4.861175537109375, -4.7276611328125, -4.594146728515625, -4.46063232421875, -4.327117919921875, -4.193603515625, -4.060089111328125, -3.92657470703125, -3.793060302734375, -3.6595458984375, -3.526031494140625, -3.39251708984375, -3.259002685546875, -3.12548828125, -2.991973876953125, -2.85845947265625, -2.724945068359375, -2.5914306640625, -2.457916259765625, -2.32440185546875, -2.190887451171875, -2.057373046875, -1.923858642578125, -1.79034423828125, -1.656829833984375, -1.5233154296875, -1.389801025390625, -1.25628662109375, -1.122772216796875, -0.9892578125, -0.855743408203125, -0.72222900390625, -0.588714599609375, -0.4552001953125, -0.321685791015625, -0.18817138671875, -0.054656982421875, 0.078857421875, 0.212371826171875, 0.34588623046875, 0.479400634765625, 0.6129150390625, 0.746429443359375, 0.87994384765625, 1.013458251953125, 1.14697265625, 1.280487060546875, 1.41400146484375, 1.547515869140625, 1.6810302734375, 1.814544677734375, 1.94805908203125, 2.081573486328125, 2.215087890625, 2.348602294921875, 2.48211669921875, 2.615631103515625, 2.7491455078125, 2.882659912109375, 3.01617431640625, 3.149688720703125, 3.283203125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 13.0, 17.0, 19.0, 27.0, 31.0, 56.0, 121.0, 157.0, 293.0, 524.0, 1056.0, 2179.0, 4934.0, 12340.0, 31836.0, 93180.0, 329710.0, 1084018.0, 1573201.0, 746667.0, 211548.0, 63907.0, 22695.0, 8924.0, 3631.0, 1560.0, 712.0, 374.0, 212.0, 98.0, 84.0, 60.0, 30.0, 20.0, 18.0, 12.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.61328125, -6.43609619140625, -6.2589111328125, -6.08172607421875, -5.904541015625, -5.72735595703125, -5.5501708984375, -5.37298583984375, -5.19580078125, -5.01861572265625, -4.8414306640625, -4.66424560546875, -4.487060546875, -4.30987548828125, -4.1326904296875, -3.95550537109375, -3.7783203125, -3.60113525390625, -3.4239501953125, -3.24676513671875, -3.069580078125, -2.89239501953125, -2.7152099609375, -2.53802490234375, -2.36083984375, -2.18365478515625, -2.0064697265625, -1.82928466796875, -1.652099609375, -1.47491455078125, -1.2977294921875, -1.12054443359375, -0.943359375, -0.76617431640625, -0.5889892578125, -0.41180419921875, -0.234619140625, -0.05743408203125, 0.1197509765625, 0.29693603515625, 0.47412109375, 0.65130615234375, 0.8284912109375, 1.00567626953125, 1.182861328125, 1.36004638671875, 1.5372314453125, 1.71441650390625, 1.8916015625, 2.06878662109375, 2.2459716796875, 2.42315673828125, 2.600341796875, 2.77752685546875, 2.9547119140625, 3.13189697265625, 3.30908203125, 3.48626708984375, 3.6634521484375, 3.84063720703125, 4.017822265625, 4.19500732421875, 4.3721923828125, 4.54937744140625, 4.7265625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 9.0, 3.0, 8.0, 8.0, 6.0, 24.0, 31.0, 26.0, 39.0, 60.0, 68.0, 99.0, 148.0, 191.0, 230.0, 306.0, 362.0, 420.0, 392.0, 388.0, 277.0, 210.0, 194.0, 135.0, 114.0, 79.0, 72.0, 51.0, 34.0, 22.0, 15.0, 17.0, 11.0, 7.0, 3.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.7265625, -10.3919677734375, -10.057373046875, -9.7227783203125, -9.38818359375, -9.0535888671875, -8.718994140625, -8.3843994140625, -8.0498046875, -7.7152099609375, -7.380615234375, -7.0460205078125, -6.71142578125, -6.3768310546875, -6.042236328125, -5.7076416015625, -5.373046875, -5.0384521484375, -4.703857421875, -4.3692626953125, -4.03466796875, -3.7000732421875, -3.365478515625, -3.0308837890625, -2.6962890625, -2.3616943359375, -2.027099609375, -1.6925048828125, -1.35791015625, -1.0233154296875, -0.688720703125, -0.3541259765625, -0.01953125, 0.3150634765625, 0.649658203125, 0.9842529296875, 1.31884765625, 1.6534423828125, 1.988037109375, 2.3226318359375, 2.6572265625, 2.9918212890625, 3.326416015625, 3.6610107421875, 3.99560546875, 4.3302001953125, 4.664794921875, 4.9993896484375, 5.333984375, 5.6685791015625, 6.003173828125, 6.3377685546875, 6.67236328125, 7.0069580078125, 7.341552734375, 7.6761474609375, 8.0107421875, 8.3453369140625, 8.679931640625, 9.0145263671875, 9.34912109375, 9.6837158203125, 10.018310546875, 10.3529052734375, 10.6875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 2.0, 13.0, 12.0, 15.0, 20.0, 35.0, 44.0, 52.0, 75.0, 120.0, 117.0, 253.0, 532.0, 1979.0, 27546.0, 1966963.0, 2162929.0, 30206.0, 2148.0, 504.0, 217.0, 141.0, 99.0, 77.0, 46.0, 31.0, 21.0, 24.0, 7.0, 14.0, 10.0, 9.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.25, -36.15478515625, -35.0595703125, -33.96435546875, -32.869140625, -31.77392578125, -30.6787109375, -29.58349609375, -28.48828125, -27.39306640625, -26.2978515625, -25.20263671875, -24.107421875, -23.01220703125, -21.9169921875, -20.82177734375, -19.7265625, -18.63134765625, -17.5361328125, -16.44091796875, -15.345703125, -14.25048828125, -13.1552734375, -12.06005859375, -10.96484375, -9.86962890625, -8.7744140625, -7.67919921875, -6.583984375, -5.48876953125, -4.3935546875, -3.29833984375, -2.203125, -1.10791015625, -0.0126953125, 1.08251953125, 2.177734375, 3.27294921875, 4.3681640625, 5.46337890625, 6.55859375, 7.65380859375, 8.7490234375, 9.84423828125, 10.939453125, 12.03466796875, 13.1298828125, 14.22509765625, 15.3203125, 16.41552734375, 17.5107421875, 18.60595703125, 19.701171875, 20.79638671875, 21.8916015625, 22.98681640625, 24.08203125, 25.17724609375, 26.2724609375, 27.36767578125, 28.462890625, 29.55810546875, 30.6533203125, 31.74853515625, 32.84375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 12.0, 30.0, 32.0, 67.0, 111.0, 134.0, 181.0, 174.0, 110.0, 85.0, 38.0, 18.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-117.48446655273438, -115.06231689453125, -112.64017486572266, -110.21802520751953, -107.79588317871094, -105.37373352050781, -102.95158386230469, -100.5294418334961, -98.10729217529297, -95.68514251708984, -93.26300048828125, -90.84085083007812, -88.41870880126953, -85.9965591430664, -83.57441711425781, -81.15226745605469, -78.73011779785156, -76.30796813964844, -73.88582611083984, -71.46367645263672, -69.04153442382812, -66.619384765625, -64.19723510742188, -61.77509307861328, -59.35295104980469, -56.93080520629883, -54.50865936279297, -52.086509704589844, -49.664363861083984, -47.242218017578125, -44.820072174072266, -42.397926330566406, -39.97577667236328, -37.55363082885742, -35.13148498535156, -32.70933532714844, -30.287189483642578, -27.86504364013672, -25.44289779663086, -23.020750045776367, -20.598604202270508, -18.17645835876465, -15.754310607910156, -13.332164764404297, -10.910017967224121, -8.487871170043945, -6.065725326538086, -3.6435775756835938, -1.2214317321777344, 1.2007148265838623, 3.622861385345459, 6.045007705688477, 8.467154502868652, 10.889301300048828, 13.311447143554688, 15.73359489440918, 18.15574073791504, 20.5778865814209, 23.00003433227539, 25.42218017578125, 27.84432601928711, 30.2664737701416, 32.688621520996094, 35.11076736450195, 37.53291320800781]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 4.0, 7.0, 12.0, 9.0, 12.0, 15.0, 15.0, 27.0, 20.0, 21.0, 29.0, 29.0, 30.0, 36.0, 42.0, 46.0, 49.0, 34.0, 37.0, 55.0, 39.0, 37.0, 39.0, 48.0, 28.0, 30.0, 39.0, 32.0, 23.0, 27.0, 20.0, 16.0, 13.0, 18.0, 16.0, 16.0, 10.0, 8.0, 7.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.1024169921875, -38.86738967895508, -37.63235855102539, -36.39733123779297, -35.16230010986328, -33.92727279663086, -32.69224548339844, -31.45721435546875, -30.222187042236328, -28.987157821655273, -27.75212860107422, -26.517101287841797, -25.282072067260742, -24.047042846679688, -22.812013626098633, -21.576984405517578, -20.341955184936523, -19.10692596435547, -17.871896743774414, -16.63686752319336, -15.401840209960938, -14.166810989379883, -12.931781768798828, -11.69675350189209, -10.461724281311035, -9.22669506072998, -7.991666793823242, -6.7566375732421875, -5.521608829498291, -4.2865800857543945, -3.05155086517334, -1.8165225982666016, -0.5814933776855469, 0.6535354852676392, 1.8885643482208252, 3.123593330383301, 4.358622074127197, 5.593650817871094, 6.828680038452148, 8.063708305358887, 9.298737525939941, 10.533766746520996, 11.768795013427734, 13.003824234008789, 14.238853454589844, 15.473881721496582, 16.708911895751953, 17.943939208984375, 19.17896842956543, 20.413997650146484, 21.64902687072754, 22.884056091308594, 24.119083404541016, 25.35411262512207, 26.589141845703125, 27.824169158935547, 29.059200286865234, 30.29422950744629, 31.529258728027344, 32.764286041259766, 33.99931716918945, 35.234344482421875, 36.46937561035156, 37.704402923583984, 38.939430236816406]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 4.0, 4.0, 7.0, 11.0, 13.0, 5.0, 15.0, 28.0, 23.0, 25.0, 35.0, 36.0, 31.0, 36.0, 35.0, 35.0, 33.0, 45.0, 50.0, 52.0, 45.0, 43.0, 48.0, 52.0, 34.0, 34.0, 33.0, 37.0, 24.0, 23.0, 19.0, 11.0, 12.0, 13.0, 13.0, 10.0, 9.0, 10.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.78125, -5.633636474609375, -5.48602294921875, -5.338409423828125, -5.1907958984375, -5.043182373046875, -4.89556884765625, -4.747955322265625, -4.600341796875, -4.452728271484375, -4.30511474609375, -4.157501220703125, -4.0098876953125, -3.862274169921875, -3.71466064453125, -3.567047119140625, -3.41943359375, -3.271820068359375, -3.12420654296875, -2.976593017578125, -2.8289794921875, -2.681365966796875, -2.53375244140625, -2.386138916015625, -2.238525390625, -2.090911865234375, -1.94329833984375, -1.795684814453125, -1.6480712890625, -1.500457763671875, -1.35284423828125, -1.205230712890625, -1.0576171875, -0.910003662109375, -0.76239013671875, -0.614776611328125, -0.4671630859375, -0.319549560546875, -0.17193603515625, -0.024322509765625, 0.123291015625, 0.270904541015625, 0.41851806640625, 0.566131591796875, 0.7137451171875, 0.861358642578125, 1.00897216796875, 1.156585693359375, 1.30419921875, 1.451812744140625, 1.59942626953125, 1.747039794921875, 1.8946533203125, 2.042266845703125, 2.18988037109375, 2.337493896484375, 2.485107421875, 2.632720947265625, 2.78033447265625, 2.927947998046875, 3.0755615234375, 3.223175048828125, 3.37078857421875, 3.518402099609375, 3.666015625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 17.0, 14.0, 27.0, 30.0, 40.0, 84.0, 133.0, 194.0, 267.0, 413.0, 655.0, 1001.0, 1514.0, 2380.0, 3773.0, 6036.0, 9738.0, 15785.0, 26294.0, 44957.0, 77196.0, 134421.0, 207793.0, 203293.0, 128703.0, 74086.0, 43523.0, 25194.0, 15367.0, 9331.0, 5810.0, 3715.0, 2268.0, 1572.0, 1005.0, 616.0, 423.0, 298.0, 190.0, 122.0, 88.0, 70.0, 37.0, 25.0, 19.0, 9.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.5546875, -0.5383567810058594, -0.5220260620117188, -0.5056953430175781, -0.4893646240234375, -0.4730339050292969, -0.45670318603515625, -0.4403724670410156, -0.424041748046875, -0.4077110290527344, -0.39138031005859375, -0.3750495910644531, -0.3587188720703125, -0.3423881530761719, -0.32605743408203125, -0.3097267150878906, -0.29339599609375, -0.2770652770996094, -0.26073455810546875, -0.24440383911132812, -0.2280731201171875, -0.21174240112304688, -0.19541168212890625, -0.17908096313476562, -0.162750244140625, -0.14641952514648438, -0.13008880615234375, -0.11375808715820312, -0.0974273681640625, -0.08109664916992188, -0.06476593017578125, -0.048435211181640625, -0.0321044921875, -0.015773773193359375, 0.00055694580078125, 0.016887664794921875, 0.0332183837890625, 0.049549102783203125, 0.06587982177734375, 0.08221054077148438, 0.098541259765625, 0.11487197875976562, 0.13120269775390625, 0.14753341674804688, 0.1638641357421875, 0.18019485473632812, 0.19652557373046875, 0.21285629272460938, 0.22918701171875, 0.24551773071289062, 0.26184844970703125, 0.2781791687011719, 0.2945098876953125, 0.3108406066894531, 0.32717132568359375, 0.3435020446777344, 0.359832763671875, 0.3761634826660156, 0.39249420166015625, 0.4088249206542969, 0.4251556396484375, 0.4414863586425781, 0.45781707763671875, 0.4741477966308594, 0.490478515625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 5.0, 9.0, 11.0, 9.0, 24.0, 16.0, 21.0, 18.0, 21.0, 28.0, 22.0, 21.0, 33.0, 35.0, 37.0, 36.0, 35.0, 42.0, 38.0, 1058.0, 42.0, 47.0, 34.0, 28.0, 24.0, 31.0, 39.0, 27.0, 32.0, 20.0, 24.0, 22.0, 19.0, 11.0, 16.0, 12.0, 10.0, 11.0, 7.0, 12.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0], "bins": [-2.728515625, -2.6475830078125, -2.566650390625, -2.4857177734375, -2.40478515625, -2.3238525390625, -2.242919921875, -2.1619873046875, -2.0810546875, -2.0001220703125, -1.919189453125, -1.8382568359375, -1.75732421875, -1.6763916015625, -1.595458984375, -1.5145263671875, -1.43359375, -1.3526611328125, -1.271728515625, -1.1907958984375, -1.10986328125, -1.0289306640625, -0.947998046875, -0.8670654296875, -0.7861328125, -0.7052001953125, -0.624267578125, -0.5433349609375, -0.46240234375, -0.3814697265625, -0.300537109375, -0.2196044921875, -0.138671875, -0.0577392578125, 0.023193359375, 0.1041259765625, 0.18505859375, 0.2659912109375, 0.346923828125, 0.4278564453125, 0.5087890625, 0.5897216796875, 0.670654296875, 0.7515869140625, 0.83251953125, 0.9134521484375, 0.994384765625, 1.0753173828125, 1.15625, 1.2371826171875, 1.318115234375, 1.3990478515625, 1.47998046875, 1.5609130859375, 1.641845703125, 1.7227783203125, 1.8037109375, 1.8846435546875, 1.965576171875, 2.0465087890625, 2.12744140625, 2.2083740234375, 2.289306640625, 2.3702392578125, 2.451171875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 3.0, 8.0, 12.0, 26.0, 39.0, 57.0, 77.0, 107.0, 148.0, 257.0, 396.0, 651.0, 877.0, 1532.0, 2418.0, 4068.0, 6662.0, 11112.0, 18745.0, 31688.0, 54881.0, 95154.0, 154544.0, 1249419.0, 179063.0, 118224.0, 69401.0, 39824.0, 23173.0, 13494.0, 8187.0, 4920.0, 2959.0, 1846.0, 1102.0, 759.0, 441.0, 296.0, 204.0, 123.0, 74.0, 45.0, 41.0, 28.0, 16.0, 9.0, 7.0, 6.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328369140625, -0.3165168762207031, -0.30466461181640625, -0.2928123474121094, -0.2809600830078125, -0.2691078186035156, -0.25725555419921875, -0.24540328979492188, -0.233551025390625, -0.22169876098632812, -0.20984649658203125, -0.19799423217773438, -0.1861419677734375, -0.17428970336914062, -0.16243743896484375, -0.15058517456054688, -0.13873291015625, -0.12688064575195312, -0.11502838134765625, -0.10317611694335938, -0.0913238525390625, -0.07947158813476562, -0.06761932373046875, -0.055767059326171875, -0.043914794921875, -0.032062530517578125, -0.02021026611328125, -0.008358001708984375, 0.0034942626953125, 0.015346527099609375, 0.02719879150390625, 0.039051055908203125, 0.0509033203125, 0.06275558471679688, 0.07460784912109375, 0.08646011352539062, 0.0983123779296875, 0.11016464233398438, 0.12201690673828125, 0.13386917114257812, 0.145721435546875, 0.15757369995117188, 0.16942596435546875, 0.18127822875976562, 0.1931304931640625, 0.20498275756835938, 0.21683502197265625, 0.22868728637695312, 0.24053955078125, 0.2523918151855469, 0.26424407958984375, 0.2760963439941406, 0.2879486083984375, 0.2998008728027344, 0.31165313720703125, 0.3235054016113281, 0.335357666015625, 0.3472099304199219, 0.35906219482421875, 0.3709144592285156, 0.3827667236328125, 0.3946189880371094, 0.40647125244140625, 0.4183235168457031, 0.43017578125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 5.0, 2.0, 4.0, 5.0, 11.0, 12.0, 9.0, 22.0, 23.0, 31.0, 32.0, 32.0, 41.0, 49.0, 60.0, 49.0, 65.0, 78.0, 63.0, 54.0, 52.0, 45.0, 47.0, 33.0, 29.0, 36.0, 20.0, 15.0, 14.0, 21.0, 7.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013685226440429688, -0.0013308972120285034, -0.001293271780014038, -0.0012556463479995728, -0.0012180209159851074, -0.001180395483970642, -0.0011427700519561768, -0.0011051446199417114, -0.001067519187927246, -0.0010298937559127808, -0.0009922683238983154, -0.0009546428918838501, -0.0009170174598693848, -0.0008793920278549194, -0.0008417665958404541, -0.0008041411638259888, -0.0007665157318115234, -0.0007288902997970581, -0.0006912648677825928, -0.0006536394357681274, -0.0006160140037536621, -0.0005783885717391968, -0.0005407631397247314, -0.0005031377077102661, -0.0004655122756958008, -0.00042788684368133545, -0.0003902614116668701, -0.0003526359796524048, -0.00031501054763793945, -0.0002773851156234741, -0.0002397596836090088, -0.00020213425159454346, -0.00016450881958007812, -0.0001268833875656128, -8.925795555114746e-05, -5.163252353668213e-05, -1.4007091522216797e-05, 2.3618340492248535e-05, 6.124377250671387e-05, 9.88692045211792e-05, 0.00013649463653564453, 0.00017412006855010986, 0.0002117455005645752, 0.00024937093257904053, 0.00028699636459350586, 0.0003246217966079712, 0.0003622472286224365, 0.00039987266063690186, 0.0004374980926513672, 0.0004751235246658325, 0.0005127489566802979, 0.0005503743886947632, 0.0005879998207092285, 0.0006256252527236938, 0.0006632506847381592, 0.0007008761167526245, 0.0007385015487670898, 0.0007761269807815552, 0.0008137524127960205, 0.0008513778448104858, 0.0008890032768249512, 0.0009266287088394165, 0.0009642541408538818, 0.0010018795728683472, 0.0010395050048828125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 4.0, 8.0, 4.0, 14.0, 16.0, 20.0, 15.0, 19.0, 42.0, 40.0, 61.0, 83.0, 104.0, 190.0, 319.0, 527.0, 2227.0, 356925.0, 682796.0, 3490.0, 637.0, 324.0, 188.0, 139.0, 80.0, 65.0, 47.0, 49.0, 28.0, 20.0, 12.0, 9.0, 7.0, 8.0, 5.0, 6.0, 5.0, 1.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0224609375, -0.02178192138671875, -0.0211029052734375, -0.02042388916015625, -0.019744873046875, -0.01906585693359375, -0.0183868408203125, -0.01770782470703125, -0.01702880859375, -0.01634979248046875, -0.0156707763671875, -0.01499176025390625, -0.014312744140625, -0.01363372802734375, -0.0129547119140625, -0.01227569580078125, -0.0115966796875, -0.01091766357421875, -0.0102386474609375, -0.00955963134765625, -0.008880615234375, -0.00820159912109375, -0.0075225830078125, -0.00684356689453125, -0.00616455078125, -0.00548553466796875, -0.0048065185546875, -0.00412750244140625, -0.003448486328125, -0.00276947021484375, -0.0020904541015625, -0.00141143798828125, -0.000732421875, -5.340576171875e-05, 0.0006256103515625, 0.00130462646484375, 0.001983642578125, 0.00266265869140625, 0.0033416748046875, 0.00402069091796875, 0.00469970703125, 0.00537872314453125, 0.0060577392578125, 0.00673675537109375, 0.007415771484375, 0.00809478759765625, 0.0087738037109375, 0.00945281982421875, 0.0101318359375, 0.01081085205078125, 0.0114898681640625, 0.01216888427734375, 0.012847900390625, 0.01352691650390625, 0.0142059326171875, 0.01488494873046875, 0.01556396484375, 0.01624298095703125, 0.0169219970703125, 0.01760101318359375, 0.018280029296875, 0.01895904541015625, 0.0196380615234375, 0.02031707763671875, 0.02099609375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 6.0, 10.0, 33.0, 52.0, 71.0, 101.0, 143.0, 140.0, 133.0, 136.0, 77.0, 49.0, 24.0, 16.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010579447261989117, -0.0010209851898252964, -0.0009840256534516811, -0.0009470661170780659, -0.0009101065807044506, -0.0008731470443308353, -0.0008361875079572201, -0.0007992279715836048, -0.0007622684352099895, -0.0007253088988363743, -0.000688349362462759, -0.0006513898260891438, -0.0006144302897155285, -0.0005774707533419132, -0.000540511216968298, -0.0005035516805946827, -0.0004665920860134065, -0.00042963254963979125, -0.000392673013266176, -0.0003557134768925607, -0.00031875394051894546, -0.0002817944041453302, -0.00024483483866788447, -0.0002078753022942692, -0.00017091576592065394, -0.00013395622954703867, -9.69966858974658e-05, -6.0037142247892916e-05, -2.307760587427765e-05, 1.3881930499337614e-05, 5.084148142486811e-05, 8.780101779848337e-05, 0.00012476055417209864, 0.0001617200905457139, 0.00019867962691932917, 0.00023563917784485966, 0.0002725986996665597, 0.00030955823604017496, 0.0003465178015176207, 0.00038347733789123595, 0.0004204368742648512, 0.0004573964106384665, 0.0004943559761159122, 0.0005313155124895275, 0.0005682750488631427, 0.000605234585236758, 0.0006421941216103733, 0.0006791536579839885, 0.0007161131943576038, 0.000753072730731219, 0.0007900322671048343, 0.0008269918034784496, 0.0008639513398520648, 0.0009009108762256801, 0.0009378704708069563, 0.0009748300071805716, 0.0010117895435541868, 0.001048749079927802, 0.0010857086163014174, 0.0011226681526750326, 0.0011596276890486479, 0.0011965872254222631, 0.0012335467617958784, 0.0012705062981694937, 0.001307465834543109]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 10.0, 13.0, 19.0, 15.0, 14.0, 34.0, 27.0, 19.0, 21.0, 34.0, 40.0, 36.0, 34.0, 44.0, 47.0, 41.0, 45.0, 51.0, 48.0, 31.0, 30.0, 43.0, 30.0, 40.0, 32.0, 29.0, 27.0, 21.0, 23.0, 19.0, 25.0, 8.0, 14.0, 9.0, 8.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.0006729364395141602, -0.0006530098617076874, -0.0006330832839012146, -0.0006131567060947418, -0.000593230128288269, -0.0005733035504817963, -0.0005533769726753235, -0.0005334503948688507, -0.0005135238170623779, -0.0004935972392559052, -0.0004736706614494324, -0.0004537440836429596, -0.0004338175058364868, -0.00041389092803001404, -0.00039396435022354126, -0.0003740377724170685, -0.0003541111946105957, -0.0003341846168041229, -0.00031425803899765015, -0.00029433146119117737, -0.0002744048833847046, -0.0002544783055782318, -0.00023455172777175903, -0.00021462514996528625, -0.00019469857215881348, -0.0001747719943523407, -0.00015484541654586792, -0.00013491883873939514, -0.00011499226093292236, -9.506568312644958e-05, -7.51391053199768e-05, -5.521252751350403e-05, -3.528594970703125e-05, -1.535937190055847e-05, 4.567205905914307e-06, 2.4493783712387085e-05, 4.442036151885986e-05, 6.434693932533264e-05, 8.427351713180542e-05, 0.0001042000949382782, 0.00012412667274475098, 0.00014405325055122375, 0.00016397982835769653, 0.0001839064061641693, 0.0002038329839706421, 0.00022375956177711487, 0.00024368613958358765, 0.0002636127173900604, 0.0002835392951965332, 0.000303465873003006, 0.00032339245080947876, 0.00034331902861595154, 0.0003632456064224243, 0.0003831721842288971, 0.0004030987620353699, 0.00042302533984184265, 0.00044295191764831543, 0.0004628784954547882, 0.000482805073261261, 0.0005027316510677338, 0.0005226582288742065, 0.0005425848066806793, 0.0005625113844871521, 0.0005824379622936249, 0.0006023645401000977]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 4.0, 4.0, 7.0, 11.0, 13.0, 5.0, 15.0, 28.0, 23.0, 25.0, 35.0, 36.0, 31.0, 36.0, 35.0, 35.0, 33.0, 45.0, 50.0, 52.0, 45.0, 43.0, 48.0, 52.0, 34.0, 34.0, 33.0, 37.0, 24.0, 23.0, 19.0, 11.0, 12.0, 13.0, 13.0, 10.0, 9.0, 10.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.78125, -5.633636474609375, -5.48602294921875, -5.338409423828125, -5.1907958984375, -5.043182373046875, -4.89556884765625, -4.747955322265625, -4.600341796875, -4.452728271484375, -4.30511474609375, -4.157501220703125, -4.0098876953125, -3.862274169921875, -3.71466064453125, -3.567047119140625, -3.41943359375, -3.271820068359375, -3.12420654296875, -2.976593017578125, -2.8289794921875, -2.681365966796875, -2.53375244140625, -2.386138916015625, -2.238525390625, -2.090911865234375, -1.94329833984375, -1.795684814453125, -1.6480712890625, -1.500457763671875, -1.35284423828125, -1.205230712890625, -1.0576171875, -0.910003662109375, -0.76239013671875, -0.614776611328125, -0.4671630859375, -0.319549560546875, -0.17193603515625, -0.024322509765625, 0.123291015625, 0.270904541015625, 0.41851806640625, 0.566131591796875, 0.7137451171875, 0.861358642578125, 1.00897216796875, 1.156585693359375, 1.30419921875, 1.451812744140625, 1.59942626953125, 1.747039794921875, 1.8946533203125, 2.042266845703125, 2.18988037109375, 2.337493896484375, 2.485107421875, 2.632720947265625, 2.78033447265625, 2.927947998046875, 3.0755615234375, 3.223175048828125, 3.37078857421875, 3.518402099609375, 3.666015625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 10.0, 5.0, 9.0, 8.0, 20.0, 30.0, 48.0, 59.0, 108.0, 161.0, 234.0, 439.0, 689.0, 1236.0, 2444.0, 5141.0, 11774.0, 30220.0, 86073.0, 273014.0, 414308.0, 142145.0, 47961.0, 18118.0, 7113.0, 3264.0, 1658.0, 912.0, 489.0, 319.0, 185.0, 124.0, 95.0, 44.0, 32.0, 23.0, 15.0, 10.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.80859375, -4.679412841796875, -4.55023193359375, -4.421051025390625, -4.2918701171875, -4.162689208984375, -4.03350830078125, -3.904327392578125, -3.775146484375, -3.645965576171875, -3.51678466796875, -3.387603759765625, -3.2584228515625, -3.129241943359375, -3.00006103515625, -2.870880126953125, -2.74169921875, -2.612518310546875, -2.48333740234375, -2.354156494140625, -2.2249755859375, -2.095794677734375, -1.96661376953125, -1.837432861328125, -1.708251953125, -1.579071044921875, -1.44989013671875, -1.320709228515625, -1.1915283203125, -1.062347412109375, -0.93316650390625, -0.803985595703125, -0.6748046875, -0.545623779296875, -0.41644287109375, -0.287261962890625, -0.1580810546875, -0.028900146484375, 0.10028076171875, 0.229461669921875, 0.358642578125, 0.487823486328125, 0.61700439453125, 0.746185302734375, 0.8753662109375, 1.004547119140625, 1.13372802734375, 1.262908935546875, 1.39208984375, 1.521270751953125, 1.65045166015625, 1.779632568359375, 1.9088134765625, 2.037994384765625, 2.16717529296875, 2.296356201171875, 2.425537109375, 2.554718017578125, 2.68389892578125, 2.813079833984375, 2.9422607421875, 3.071441650390625, 3.20062255859375, 3.329803466796875, 3.458984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 8.0, 14.0, 17.0, 25.0, 28.0, 20.0, 30.0, 26.0, 35.0, 45.0, 53.0, 78.0, 81.0, 268.0, 1730.0, 161.0, 73.0, 62.0, 64.0, 47.0, 27.0, 37.0, 30.0, 11.0, 22.0, 12.0, 10.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.65625, -22.966552734375, -22.27685546875, -21.587158203125, -20.8974609375, -20.207763671875, -19.51806640625, -18.828369140625, -18.138671875, -17.448974609375, -16.75927734375, -16.069580078125, -15.3798828125, -14.690185546875, -14.00048828125, -13.310791015625, -12.62109375, -11.931396484375, -11.24169921875, -10.552001953125, -9.8623046875, -9.172607421875, -8.48291015625, -7.793212890625, -7.103515625, -6.413818359375, -5.72412109375, -5.034423828125, -4.3447265625, -3.655029296875, -2.96533203125, -2.275634765625, -1.5859375, -0.896240234375, -0.20654296875, 0.483154296875, 1.1728515625, 1.862548828125, 2.55224609375, 3.241943359375, 3.931640625, 4.621337890625, 5.31103515625, 6.000732421875, 6.6904296875, 7.380126953125, 8.06982421875, 8.759521484375, 9.44921875, 10.138916015625, 10.82861328125, 11.518310546875, 12.2080078125, 12.897705078125, 13.58740234375, 14.277099609375, 14.966796875, 15.656494140625, 16.34619140625, 17.035888671875, 17.7255859375, 18.415283203125, 19.10498046875, 19.794677734375, 20.484375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 10.0, 13.0, 18.0, 21.0, 52.0, 54.0, 94.0, 149.0, 299.0, 756.0, 13607.0, 3124460.0, 4868.0, 608.0, 280.0, 156.0, 61.0, 64.0, 46.0, 36.0, 19.0, 17.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.25, -65.294921875, -63.33984375, -61.384765625, -59.4296875, -57.474609375, -55.51953125, -53.564453125, -51.609375, -49.654296875, -47.69921875, -45.744140625, -43.7890625, -41.833984375, -39.87890625, -37.923828125, -35.96875, -34.013671875, -32.05859375, -30.103515625, -28.1484375, -26.193359375, -24.23828125, -22.283203125, -20.328125, -18.373046875, -16.41796875, -14.462890625, -12.5078125, -10.552734375, -8.59765625, -6.642578125, -4.6875, -2.732421875, -0.77734375, 1.177734375, 3.1328125, 5.087890625, 7.04296875, 8.998046875, 10.953125, 12.908203125, 14.86328125, 16.818359375, 18.7734375, 20.728515625, 22.68359375, 24.638671875, 26.59375, 28.548828125, 30.50390625, 32.458984375, 34.4140625, 36.369140625, 38.32421875, 40.279296875, 42.234375, 44.189453125, 46.14453125, 48.099609375, 50.0546875, 52.009765625, 53.96484375, 55.919921875, 57.875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 410.0, 596.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-306.86004638671875, -301.4834899902344, -296.10693359375, -290.73040771484375, -285.3538513183594, -279.977294921875, -274.6007385253906, -269.2242126464844, -263.84765625, -258.4710998535156, -253.0945587158203, -247.71800231933594, -242.34146118164062, -236.96490478515625, -231.58836364746094, -226.21180725097656, -220.83526611328125, -215.45870971679688, -210.08216857910156, -204.7056121826172, -199.32907104492188, -193.9525146484375, -188.5759735107422, -183.1994171142578, -177.82286071777344, -172.44630432128906, -167.06976318359375, -161.69320678710938, -156.31666564941406, -150.9401092529297, -145.56356811523438, -140.18701171875, -134.8104705810547, -129.4339141845703, -124.057373046875, -118.68082427978516, -113.30427551269531, -107.92772674560547, -102.55117797851562, -97.17462158203125, -91.79808044433594, -86.4215316772461, -81.04498291015625, -75.6684341430664, -70.29188537597656, -64.91533660888672, -59.53878402709961, -54.162235260009766, -48.78568649291992, -43.40913772583008, -38.032588958740234, -32.656036376953125, -27.279489517211914, -21.90294075012207, -16.526390075683594, -11.14984130859375, -5.773292541503906, -0.3967432975769043, 4.979805946350098, 10.356355667114258, 15.732904434204102, 21.109453201293945, 26.486003875732422, 31.862552642822266, 37.23910140991211]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 12.0, 7.0, 9.0, 16.0, 12.0, 15.0, 12.0, 17.0, 21.0, 21.0, 14.0, 20.0, 27.0, 36.0, 29.0, 29.0, 35.0, 37.0, 34.0, 33.0, 33.0, 41.0, 46.0, 39.0, 31.0, 23.0, 22.0, 34.0, 29.0, 29.0, 14.0, 24.0, 21.0, 20.0, 26.0, 18.0, 14.0, 18.0, 7.0, 13.0, 6.0, 13.0, 7.0, 6.0, 5.0, 4.0, 6.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-34.619956970214844, -33.49950408935547, -32.37905502319336, -31.258602142333984, -30.13814926147461, -29.017698287963867, -27.897247314453125, -26.77679443359375, -25.656343460083008, -24.535892486572266, -23.41543960571289, -22.29498863220215, -21.174537658691406, -20.05408477783203, -18.93363380432129, -17.813182830810547, -16.692729949951172, -15.572278022766113, -14.451826095581055, -13.331375122070312, -12.210923194885254, -11.090471267700195, -9.970020294189453, -8.849568367004395, -7.729116439819336, -6.608664512634277, -5.488213062286377, -4.367761611938477, -3.247309684753418, -2.1268577575683594, -1.006406307220459, 0.1140451431274414, 1.2344970703125, 2.3549487590789795, 3.475400447845459, 4.595851898193359, 5.716303825378418, 6.836755752563477, 7.957207202911377, 9.077658653259277, 10.198110580444336, 11.318562507629395, 12.439014434814453, 13.559465408325195, 14.679917335510254, 15.800369262695312, 16.920820236206055, 18.041271209716797, 19.161724090576172, 20.282175064086914, 21.40262794494629, 22.52307891845703, 23.643531799316406, 24.76398277282715, 25.88443374633789, 27.004886627197266, 28.125337600708008, 29.24578857421875, 30.366241455078125, 31.486692428588867, 32.60714340209961, 33.727596282958984, 34.84804916381836, 35.96849822998047, 37.088951110839844]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 1.0, 5.0, 3.0, 4.0, 5.0, 9.0, 10.0, 16.0, 13.0, 18.0, 22.0, 33.0, 28.0, 26.0, 35.0, 26.0, 39.0, 42.0, 31.0, 45.0, 53.0, 42.0, 43.0, 39.0, 42.0, 51.0, 36.0, 37.0, 35.0, 27.0, 29.0, 21.0, 26.0, 20.0, 15.0, 17.0, 9.0, 6.0, 11.0, 15.0, 5.0, 8.0, 2.0, 1.0, 3.0, 3.0], "bins": [-5.828125, -5.681365966796875, -5.53460693359375, -5.387847900390625, -5.2410888671875, -5.094329833984375, -4.94757080078125, -4.800811767578125, -4.654052734375, -4.507293701171875, -4.36053466796875, -4.213775634765625, -4.0670166015625, -3.920257568359375, -3.77349853515625, -3.626739501953125, -3.47998046875, -3.333221435546875, -3.18646240234375, -3.039703369140625, -2.8929443359375, -2.746185302734375, -2.59942626953125, -2.452667236328125, -2.305908203125, -2.159149169921875, -2.01239013671875, -1.865631103515625, -1.7188720703125, -1.572113037109375, -1.42535400390625, -1.278594970703125, -1.1318359375, -0.985076904296875, -0.83831787109375, -0.691558837890625, -0.5447998046875, -0.398040771484375, -0.25128173828125, -0.104522705078125, 0.042236328125, 0.188995361328125, 0.33575439453125, 0.482513427734375, 0.6292724609375, 0.776031494140625, 0.92279052734375, 1.069549560546875, 1.21630859375, 1.363067626953125, 1.50982666015625, 1.656585693359375, 1.8033447265625, 1.950103759765625, 2.09686279296875, 2.243621826171875, 2.390380859375, 2.537139892578125, 2.68389892578125, 2.830657958984375, 2.9774169921875, 3.124176025390625, 3.27093505859375, 3.417694091796875, 3.564453125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 9.0, 8.0, 12.0, 21.0, 13.0, 31.0, 40.0, 29.0, 38.0, 51.0, 80.0, 129.0, 218.0, 508.0, 3086.0, 63141.0, 3217772.0, 892279.0, 14703.0, 1210.0, 289.0, 180.0, 92.0, 68.0, 51.0, 40.0, 32.0, 15.0, 30.0, 21.0, 16.0, 14.0, 8.0, 9.0, 7.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0], "bins": [-28.296875, -27.5673828125, -26.837890625, -26.1083984375, -25.37890625, -24.6494140625, -23.919921875, -23.1904296875, -22.4609375, -21.7314453125, -21.001953125, -20.2724609375, -19.54296875, -18.8134765625, -18.083984375, -17.3544921875, -16.625, -15.8955078125, -15.166015625, -14.4365234375, -13.70703125, -12.9775390625, -12.248046875, -11.5185546875, -10.7890625, -10.0595703125, -9.330078125, -8.6005859375, -7.87109375, -7.1416015625, -6.412109375, -5.6826171875, -4.953125, -4.2236328125, -3.494140625, -2.7646484375, -2.03515625, -1.3056640625, -0.576171875, 0.1533203125, 0.8828125, 1.6123046875, 2.341796875, 3.0712890625, 3.80078125, 4.5302734375, 5.259765625, 5.9892578125, 6.71875, 7.4482421875, 8.177734375, 8.9072265625, 9.63671875, 10.3662109375, 11.095703125, 11.8251953125, 12.5546875, 13.2841796875, 14.013671875, 14.7431640625, 15.47265625, 16.2021484375, 16.931640625, 17.6611328125, 18.390625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 13.0, 14.0, 23.0, 25.0, 46.0, 69.0, 86.0, 102.0, 188.0, 230.0, 357.0, 385.0, 486.0, 517.0, 391.0, 331.0, 221.0, 190.0, 131.0, 77.0, 52.0, 38.0, 28.0, 24.0, 17.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.4453125, -13.0499267578125, -12.654541015625, -12.2591552734375, -11.86376953125, -11.4683837890625, -11.072998046875, -10.6776123046875, -10.2822265625, -9.8868408203125, -9.491455078125, -9.0960693359375, -8.70068359375, -8.3052978515625, -7.909912109375, -7.5145263671875, -7.119140625, -6.7237548828125, -6.328369140625, -5.9329833984375, -5.53759765625, -5.1422119140625, -4.746826171875, -4.3514404296875, -3.9560546875, -3.5606689453125, -3.165283203125, -2.7698974609375, -2.37451171875, -1.9791259765625, -1.583740234375, -1.1883544921875, -0.79296875, -0.3975830078125, -0.002197265625, 0.3931884765625, 0.78857421875, 1.1839599609375, 1.579345703125, 1.9747314453125, 2.3701171875, 2.7655029296875, 3.160888671875, 3.5562744140625, 3.95166015625, 4.3470458984375, 4.742431640625, 5.1378173828125, 5.533203125, 5.9285888671875, 6.323974609375, 6.7193603515625, 7.11474609375, 7.5101318359375, 7.905517578125, 8.3009033203125, 8.6962890625, 9.0916748046875, 9.487060546875, 9.8824462890625, 10.27783203125, 10.6732177734375, 11.068603515625, 11.4639892578125, 11.859375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 9.0, 16.0, 3.0, 14.0, 23.0, 22.0, 45.0, 44.0, 55.0, 103.0, 111.0, 169.0, 227.0, 380.0, 894.0, 4931.0, 170860.0, 3822117.0, 186775.0, 5234.0, 942.0, 422.0, 252.0, 169.0, 123.0, 101.0, 74.0, 39.0, 35.0, 28.0, 17.0, 13.0, 12.0, 6.0, 6.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.1875, -35.0390625, -33.890625, -32.7421875, -31.59375, -30.4453125, -29.296875, -28.1484375, -27.0, -25.8515625, -24.703125, -23.5546875, -22.40625, -21.2578125, -20.109375, -18.9609375, -17.8125, -16.6640625, -15.515625, -14.3671875, -13.21875, -12.0703125, -10.921875, -9.7734375, -8.625, -7.4765625, -6.328125, -5.1796875, -4.03125, -2.8828125, -1.734375, -0.5859375, 0.5625, 1.7109375, 2.859375, 4.0078125, 5.15625, 6.3046875, 7.453125, 8.6015625, 9.75, 10.8984375, 12.046875, 13.1953125, 14.34375, 15.4921875, 16.640625, 17.7890625, 18.9375, 20.0859375, 21.234375, 22.3828125, 23.53125, 24.6796875, 25.828125, 26.9765625, 28.125, 29.2734375, 30.421875, 31.5703125, 32.71875, 33.8671875, 35.015625, 36.1640625, 37.3125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 31.0, 78.0, 136.0, 200.0, 211.0, 169.0, 105.0, 51.0, 16.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.55401611328125, -63.283809661865234, -60.01360321044922, -56.74340057373047, -53.47319030761719, -50.20298767089844, -46.93278121948242, -43.662574768066406, -40.39236831665039, -37.122161865234375, -33.85195541381836, -30.581750869750977, -27.31154441833496, -24.041337966918945, -20.771133422851562, -17.500926971435547, -14.230720520019531, -10.960514068603516, -7.690308570861816, -4.420103073120117, -1.1498966217041016, 2.120309829711914, 5.390514373779297, 8.660720825195312, 11.930927276611328, 15.201133728027344, 18.47134017944336, 21.741544723510742, 25.011751174926758, 28.281957626342773, 31.552162170410156, 34.82236862182617, 38.09257507324219, 41.3627815246582, 44.63298797607422, 47.90319061279297, 51.17340087890625, 54.443603515625, 57.713809967041016, 60.98401641845703, 64.25422668457031, 67.52442932128906, 70.79463958740234, 74.0648422241211, 77.33505249023438, 80.60525512695312, 83.87545776367188, 87.14566802978516, 90.4158706665039, 93.68607330322266, 96.95628356933594, 100.22648620605469, 103.49669647216797, 106.76689910888672, 110.037109375, 113.30731201171875, 116.5775146484375, 119.84771728515625, 123.11792755126953, 126.38813018798828, 129.65834045410156, 132.9285430908203, 136.19874572753906, 139.46896362304688, 142.73916625976562]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 2.0, 7.0, 28.0, 20.0, 18.0, 22.0, 21.0, 25.0, 41.0, 30.0, 33.0, 37.0, 46.0, 35.0, 47.0, 44.0, 45.0, 57.0, 39.0, 36.0, 32.0, 39.0, 33.0, 41.0, 30.0, 32.0, 21.0, 23.0, 19.0, 16.0, 15.0, 11.0, 8.0, 11.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.150726318359375, -34.92421340942383, -33.69770050048828, -32.471187591552734, -31.244674682617188, -30.01816177368164, -28.791648864746094, -27.565135955810547, -26.338623046875, -25.112110137939453, -23.885597229003906, -22.65908432006836, -21.432571411132812, -20.206058502197266, -18.97954559326172, -17.753032684326172, -16.526519775390625, -15.300006866455078, -14.073493957519531, -12.846981048583984, -11.620468139648438, -10.39395523071289, -9.167442321777344, -7.940929412841797, -6.71441650390625, -5.487903594970703, -4.261390686035156, -3.0348777770996094, -1.8083648681640625, -0.5818519592285156, 0.6446609497070312, 1.8711738586425781, 3.0976905822753906, 4.3242034912109375, 5.550716400146484, 6.777229309082031, 8.003742218017578, 9.230255126953125, 10.456768035888672, 11.683280944824219, 12.909793853759766, 14.136306762695312, 15.36281967163086, 16.589332580566406, 17.815845489501953, 19.0423583984375, 20.268871307373047, 21.495384216308594, 22.72189712524414, 23.948410034179688, 25.174922943115234, 26.40143585205078, 27.627948760986328, 28.854461669921875, 30.080974578857422, 31.30748748779297, 32.534000396728516, 33.76051330566406, 34.98702621459961, 36.213539123535156, 37.4400520324707, 38.66656494140625, 39.8930778503418, 41.119590759277344, 42.34610366821289]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 8.0, 6.0, 8.0, 9.0, 8.0, 15.0, 20.0, 19.0, 19.0, 26.0, 30.0, 30.0, 52.0, 33.0, 46.0, 49.0, 42.0, 46.0, 42.0, 48.0, 41.0, 37.0, 45.0, 33.0, 43.0, 22.0, 23.0, 33.0, 32.0, 28.0, 16.0, 15.0, 10.0, 11.0, 9.0, 12.0, 11.0, 6.0, 3.0, 7.0, 4.0, 2.0], "bins": [-6.1953125, -6.04296875, -5.890625, -5.73828125, -5.5859375, -5.43359375, -5.28125, -5.12890625, -4.9765625, -4.82421875, -4.671875, -4.51953125, -4.3671875, -4.21484375, -4.0625, -3.91015625, -3.7578125, -3.60546875, -3.453125, -3.30078125, -3.1484375, -2.99609375, -2.84375, -2.69140625, -2.5390625, -2.38671875, -2.234375, -2.08203125, -1.9296875, -1.77734375, -1.625, -1.47265625, -1.3203125, -1.16796875, -1.015625, -0.86328125, -0.7109375, -0.55859375, -0.40625, -0.25390625, -0.1015625, 0.05078125, 0.203125, 0.35546875, 0.5078125, 0.66015625, 0.8125, 0.96484375, 1.1171875, 1.26953125, 1.421875, 1.57421875, 1.7265625, 1.87890625, 2.03125, 2.18359375, 2.3359375, 2.48828125, 2.640625, 2.79296875, 2.9453125, 3.09765625, 3.25, 3.40234375, 3.5546875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 4.0, 7.0, 11.0, 17.0, 29.0, 43.0, 64.0, 79.0, 134.0, 195.0, 275.0, 444.0, 672.0, 946.0, 1413.0, 2242.0, 3232.0, 5228.0, 8278.0, 12758.0, 20593.0, 33330.0, 54897.0, 91440.0, 151345.0, 207747.0, 174894.0, 108367.0, 64597.0, 39175.0, 24265.0, 14882.0, 9516.0, 6000.0, 4024.0, 2564.0, 1623.0, 1080.0, 760.0, 442.0, 330.0, 211.0, 133.0, 99.0, 72.0, 30.0, 23.0, 14.0, 15.0, 9.0, 6.0, 10.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.50732421875, -0.491302490234375, -0.47528076171875, -0.459259033203125, -0.4432373046875, -0.427215576171875, -0.41119384765625, -0.395172119140625, -0.379150390625, -0.363128662109375, -0.34710693359375, -0.331085205078125, -0.3150634765625, -0.299041748046875, -0.28302001953125, -0.266998291015625, -0.2509765625, -0.234954833984375, -0.21893310546875, -0.202911376953125, -0.1868896484375, -0.170867919921875, -0.15484619140625, -0.138824462890625, -0.122802734375, -0.106781005859375, -0.09075927734375, -0.074737548828125, -0.0587158203125, -0.042694091796875, -0.02667236328125, -0.010650634765625, 0.00537109375, 0.021392822265625, 0.03741455078125, 0.053436279296875, 0.0694580078125, 0.085479736328125, 0.10150146484375, 0.117523193359375, 0.133544921875, 0.149566650390625, 0.16558837890625, 0.181610107421875, 0.1976318359375, 0.213653564453125, 0.22967529296875, 0.245697021484375, 0.26171875, 0.277740478515625, 0.29376220703125, 0.309783935546875, 0.3258056640625, 0.341827392578125, 0.35784912109375, 0.373870849609375, 0.389892578125, 0.405914306640625, 0.42193603515625, 0.437957763671875, 0.4539794921875, 0.470001220703125, 0.48602294921875, 0.502044677734375, 0.51806640625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 6.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 6.0, 11.0, 12.0, 5.0, 16.0, 22.0, 22.0, 24.0, 26.0, 28.0, 22.0, 39.0, 30.0, 33.0, 33.0, 41.0, 31.0, 39.0, 1061.0, 45.0, 53.0, 41.0, 30.0, 45.0, 35.0, 29.0, 32.0, 25.0, 25.0, 29.0, 17.0, 13.0, 19.0, 20.0, 10.0, 8.0, 5.0, 11.0, 7.0, 8.0, 2.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.849609375, -2.757293701171875, -2.66497802734375, -2.572662353515625, -2.4803466796875, -2.388031005859375, -2.29571533203125, -2.203399658203125, -2.111083984375, -2.018768310546875, -1.92645263671875, -1.834136962890625, -1.7418212890625, -1.649505615234375, -1.55718994140625, -1.464874267578125, -1.37255859375, -1.280242919921875, -1.18792724609375, -1.095611572265625, -1.0032958984375, -0.910980224609375, -0.81866455078125, -0.726348876953125, -0.634033203125, -0.541717529296875, -0.44940185546875, -0.357086181640625, -0.2647705078125, -0.172454833984375, -0.08013916015625, 0.012176513671875, 0.1044921875, 0.196807861328125, 0.28912353515625, 0.381439208984375, 0.4737548828125, 0.566070556640625, 0.65838623046875, 0.750701904296875, 0.843017578125, 0.935333251953125, 1.02764892578125, 1.119964599609375, 1.2122802734375, 1.304595947265625, 1.39691162109375, 1.489227294921875, 1.58154296875, 1.673858642578125, 1.76617431640625, 1.858489990234375, 1.9508056640625, 2.043121337890625, 2.13543701171875, 2.227752685546875, 2.320068359375, 2.412384033203125, 2.50469970703125, 2.597015380859375, 2.6893310546875, 2.781646728515625, 2.87396240234375, 2.966278076171875, 3.05859375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 6.0, 5.0, 9.0, 8.0, 19.0, 20.0, 28.0, 62.0, 67.0, 98.0, 142.0, 213.0, 320.0, 476.0, 729.0, 1127.0, 1639.0, 2599.0, 4161.0, 6314.0, 10043.0, 15863.0, 26158.0, 42823.0, 70496.0, 114014.0, 162312.0, 1229071.0, 148895.0, 99700.0, 61294.0, 36968.0, 22736.0, 14131.0, 8556.0, 5678.0, 3529.0, 2224.0, 1562.0, 1016.0, 655.0, 439.0, 305.0, 211.0, 138.0, 87.0, 64.0, 38.0, 24.0, 25.0, 17.0, 10.0, 4.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.349609375, -0.3384590148925781, -0.32730865478515625, -0.3161582946777344, -0.3050079345703125, -0.2938575744628906, -0.28270721435546875, -0.2715568542480469, -0.260406494140625, -0.24925613403320312, -0.23810577392578125, -0.22695541381835938, -0.2158050537109375, -0.20465469360351562, -0.19350433349609375, -0.18235397338867188, -0.17120361328125, -0.16005325317382812, -0.14890289306640625, -0.13775253295898438, -0.1266021728515625, -0.11545181274414062, -0.10430145263671875, -0.09315109252929688, -0.082000732421875, -0.07085037231445312, -0.05970001220703125, -0.048549652099609375, -0.0373992919921875, -0.026248931884765625, -0.01509857177734375, -0.003948211669921875, 0.0072021484375, 0.018352508544921875, 0.02950286865234375, 0.040653228759765625, 0.0518035888671875, 0.06295394897460938, 0.07410430908203125, 0.08525466918945312, 0.096405029296875, 0.10755538940429688, 0.11870574951171875, 0.12985610961914062, 0.1410064697265625, 0.15215682983398438, 0.16330718994140625, 0.17445755004882812, 0.18560791015625, 0.19675827026367188, 0.20790863037109375, 0.21905899047851562, 0.2302093505859375, 0.24135971069335938, 0.25251007080078125, 0.2636604309082031, 0.274810791015625, 0.2859611511230469, 0.29711151123046875, 0.3082618713378906, 0.3194122314453125, 0.3305625915527344, 0.34171295166015625, 0.3528633117675781, 0.364013671875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 10.0, 5.0, 10.0, 9.0, 13.0, 24.0, 22.0, 22.0, 30.0, 40.0, 42.0, 48.0, 66.0, 52.0, 57.0, 71.0, 59.0, 65.0, 58.0, 52.0, 45.0, 38.0, 35.0, 17.0, 21.0, 20.0, 19.0, 12.0, 9.0, 10.0, 4.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012407302856445312, -0.0011986792087554932, -0.001156628131866455, -0.001114577054977417, -0.001072525978088379, -0.0010304749011993408, -0.0009884238243103027, -0.0009463727474212646, -0.0009043216705322266, -0.0008622705936431885, -0.0008202195167541504, -0.0007781684398651123, -0.0007361173629760742, -0.0006940662860870361, -0.000652015209197998, -0.00060996413230896, -0.0005679130554199219, -0.0005258619785308838, -0.0004838109016418457, -0.0004417598247528076, -0.00039970874786376953, -0.00035765767097473145, -0.00031560659408569336, -0.0002735555171966553, -0.0002315044403076172, -0.0001894533634185791, -0.00014740228652954102, -0.00010535120964050293, -6.330013275146484e-05, -2.1249055862426758e-05, 2.0802021026611328e-05, 6.285309791564941e-05, 0.0001049041748046875, 0.00014695525169372559, 0.00018900632858276367, 0.00023105740547180176, 0.00027310848236083984, 0.00031515955924987793, 0.000357210636138916, 0.0003992617130279541, 0.0004413127899169922, 0.0004833638668060303, 0.0005254149436950684, 0.0005674660205841064, 0.0006095170974731445, 0.0006515681743621826, 0.0006936192512512207, 0.0007356703281402588, 0.0007777214050292969, 0.000819772481918335, 0.000861823558807373, 0.0009038746356964111, 0.0009459257125854492, 0.0009879767894744873, 0.0010300278663635254, 0.0010720789432525635, 0.0011141300201416016, 0.0011561810970306396, 0.0011982321739196777, 0.0012402832508087158, 0.001282334327697754, 0.001324385404586792, 0.00136643648147583, 0.0014084875583648682, 0.0014505386352539062]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 9.0, 10.0, 16.0, 24.0, 26.0, 50.0, 50.0, 90.0, 143.0, 254.0, 456.0, 1816.0, 649730.0, 393263.0, 1451.0, 482.0, 258.0, 125.0, 80.0, 44.0, 35.0, 31.0, 26.0, 19.0, 10.0, 15.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03118896484375, -0.03027033805847168, -0.02935171127319336, -0.02843308448791504, -0.02751445770263672, -0.0265958309173584, -0.025677204132080078, -0.024758577346801758, -0.023839950561523438, -0.022921323776245117, -0.022002696990966797, -0.021084070205688477, -0.020165443420410156, -0.019246816635131836, -0.018328189849853516, -0.017409563064575195, -0.016490936279296875, -0.015572309494018555, -0.014653682708740234, -0.013735055923461914, -0.012816429138183594, -0.011897802352905273, -0.010979175567626953, -0.010060548782348633, -0.009141921997070312, -0.008223295211791992, -0.007304668426513672, -0.0063860416412353516, -0.005467414855957031, -0.004548788070678711, -0.0036301612854003906, -0.0027115345001220703, -0.00179290771484375, -0.0008742809295654297, 4.4345855712890625e-05, 0.0009629726409912109, 0.0018815994262695312, 0.0028002262115478516, 0.003718852996826172, 0.004637479782104492, 0.0055561065673828125, 0.006474733352661133, 0.007393360137939453, 0.008311986923217773, 0.009230613708496094, 0.010149240493774414, 0.011067867279052734, 0.011986494064331055, 0.012905120849609375, 0.013823747634887695, 0.014742374420166016, 0.015661001205444336, 0.016579627990722656, 0.017498254776000977, 0.018416881561279297, 0.019335508346557617, 0.020254135131835938, 0.021172761917114258, 0.022091388702392578, 0.0230100154876709, 0.02392864227294922, 0.02484726905822754, 0.02576589584350586, 0.02668452262878418, 0.0276031494140625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 30.0, 927.0, 62.0], "bins": [-0.02315860614180565, -0.02278851717710495, -0.02241842821240425, -0.022048339247703552, -0.021678250283002853, -0.021308161318302155, -0.020938072353601456, -0.020567981526255608, -0.02019789256155491, -0.01982780359685421, -0.01945771463215351, -0.019087625667452812, -0.018717536702752113, -0.018347445875406265, -0.017977356910705566, -0.017607267946004868, -0.01723717898130417, -0.01686709001660347, -0.01649700105190277, -0.016126912087202072, -0.015756823122501373, -0.0153867332264781, -0.015016644261777401, -0.014646555297076702, -0.014276467263698578, -0.013906378298997879, -0.01353628933429718, -0.013166200369596481, -0.012796110473573208, -0.012426021508872509, -0.01205593254417181, -0.011685843579471111, -0.011315753683447838, -0.010945664718747139, -0.01057557575404644, -0.010205486789345741, -0.009835396893322468, -0.009465307928621769, -0.00909521896392107, -0.008725129999220371, -0.008355040103197098, -0.007984951138496399, -0.007614861708134413, -0.007244772743433714, -0.006874683313071728, -0.006504594348371029, -0.00613450538367033, -0.005764416418969631, -0.005394327454268932, -0.0050242384895682335, -0.004654149059206247, -0.0042840600945055485, -0.003913970664143562, -0.0035438816994428635, -0.0031737927347421646, -0.002803703537210822, -0.0024336143396794796, -0.002063525142148137, -0.0016934360610321164, -0.0013233469799160957, -0.0009532577823847532, -0.0005831685848534107, -0.00021307962015271187, 0.00015700957737863064, 0.0005270987749099731]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 10.0, 11.0, 9.0, 20.0, 23.0, 22.0, 18.0, 32.0, 39.0, 48.0, 57.0, 55.0, 62.0, 48.0, 52.0, 55.0, 52.0, 50.0, 40.0, 54.0, 43.0, 37.0, 45.0, 30.0, 21.0, 12.0, 13.0, 16.0, 9.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006859898567199707, -0.0006585754454135895, -0.0006311610341072083, -0.000603746622800827, -0.0005763322114944458, -0.0005489178001880646, -0.0005215033888816833, -0.0004940889775753021, -0.0004666745662689209, -0.00043926015496253967, -0.00041184574365615845, -0.0003844313323497772, -0.000357016921043396, -0.00032960250973701477, -0.00030218809843063354, -0.0002747736871242523, -0.0002473592758178711, -0.00021994486451148987, -0.00019253045320510864, -0.00016511604189872742, -0.0001377016305923462, -0.00011028721928596497, -8.287280797958374e-05, -5.5458396673202515e-05, -2.804398536682129e-05, -6.295740604400635e-07, 2.6784837245941162e-05, 5.419924855232239e-05, 8.161365985870361e-05, 0.00010902807116508484, 0.00013644248247146606, 0.0001638568937778473, 0.00019127130508422852, 0.00021868571639060974, 0.00024610012769699097, 0.0002735145390033722, 0.0003009289503097534, 0.00032834336161613464, 0.00035575777292251587, 0.0003831721842288971, 0.0004105865955352783, 0.00043800100684165955, 0.00046541541814804077, 0.000492829829454422, 0.0005202442407608032, 0.0005476586520671844, 0.0005750730633735657, 0.0006024874746799469, 0.0006299018859863281, 0.0006573162972927094, 0.0006847307085990906, 0.0007121451199054718, 0.000739559531211853, 0.0007669739425182343, 0.0007943883538246155, 0.0008218027651309967, 0.0008492171764373779, 0.0008766315877437592, 0.0009040459990501404, 0.0009314604103565216, 0.0009588748216629028, 0.000986289232969284, 0.0010137036442756653, 0.0010411180555820465, 0.0010685324668884277]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 8.0, 6.0, 8.0, 9.0, 8.0, 15.0, 20.0, 19.0, 19.0, 26.0, 30.0, 30.0, 52.0, 33.0, 46.0, 49.0, 42.0, 46.0, 42.0, 48.0, 41.0, 37.0, 45.0, 33.0, 43.0, 22.0, 23.0, 33.0, 32.0, 28.0, 16.0, 15.0, 10.0, 11.0, 9.0, 12.0, 11.0, 6.0, 3.0, 7.0, 4.0, 2.0], "bins": [-6.1953125, -6.04296875, -5.890625, -5.73828125, -5.5859375, -5.43359375, -5.28125, -5.12890625, -4.9765625, -4.82421875, -4.671875, -4.51953125, -4.3671875, -4.21484375, -4.0625, -3.91015625, -3.7578125, -3.60546875, -3.453125, -3.30078125, -3.1484375, -2.99609375, -2.84375, -2.69140625, -2.5390625, -2.38671875, -2.234375, -2.08203125, -1.9296875, -1.77734375, -1.625, -1.47265625, -1.3203125, -1.16796875, -1.015625, -0.86328125, -0.7109375, -0.55859375, -0.40625, -0.25390625, -0.1015625, 0.05078125, 0.203125, 0.35546875, 0.5078125, 0.66015625, 0.8125, 0.96484375, 1.1171875, 1.26953125, 1.421875, 1.57421875, 1.7265625, 1.87890625, 2.03125, 2.18359375, 2.3359375, 2.48828125, 2.640625, 2.79296875, 2.9453125, 3.09765625, 3.25, 3.40234375, 3.5546875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 11.0, 16.0, 28.0, 30.0, 81.0, 130.0, 249.0, 491.0, 878.0, 1745.0, 3457.0, 6839.0, 14517.0, 33167.0, 93482.0, 343523.0, 380973.0, 102505.0, 36116.0, 15384.0, 7449.0, 3684.0, 1825.0, 916.0, 474.0, 259.0, 140.0, 79.0, 42.0, 17.0, 15.0, 17.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91015625, -3.7755126953125, -3.640869140625, -3.5062255859375, -3.37158203125, -3.2369384765625, -3.102294921875, -2.9676513671875, -2.8330078125, -2.6983642578125, -2.563720703125, -2.4290771484375, -2.29443359375, -2.1597900390625, -2.025146484375, -1.8905029296875, -1.755859375, -1.6212158203125, -1.486572265625, -1.3519287109375, -1.21728515625, -1.0826416015625, -0.947998046875, -0.8133544921875, -0.6787109375, -0.5440673828125, -0.409423828125, -0.2747802734375, -0.14013671875, -0.0054931640625, 0.129150390625, 0.2637939453125, 0.3984375, 0.5330810546875, 0.667724609375, 0.8023681640625, 0.93701171875, 1.0716552734375, 1.206298828125, 1.3409423828125, 1.4755859375, 1.6102294921875, 1.744873046875, 1.8795166015625, 2.01416015625, 2.1488037109375, 2.283447265625, 2.4180908203125, 2.552734375, 2.6873779296875, 2.822021484375, 2.9566650390625, 3.09130859375, 3.2259521484375, 3.360595703125, 3.4952392578125, 3.6298828125, 3.7645263671875, 3.899169921875, 4.0338134765625, 4.16845703125, 4.3031005859375, 4.437744140625, 4.5723876953125, 4.70703125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 7.0, 5.0, 3.0, 18.0, 6.0, 12.0, 25.0, 20.0, 21.0, 33.0, 35.0, 36.0, 36.0, 44.0, 46.0, 52.0, 86.0, 157.0, 1571.0, 246.0, 107.0, 78.0, 55.0, 40.0, 35.0, 41.0, 22.0, 27.0, 29.0, 25.0, 16.0, 22.0, 13.0, 14.0, 12.0, 8.0, 8.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.109375, -16.569580078125, -16.02978515625, -15.489990234375, -14.9501953125, -14.410400390625, -13.87060546875, -13.330810546875, -12.791015625, -12.251220703125, -11.71142578125, -11.171630859375, -10.6318359375, -10.092041015625, -9.55224609375, -9.012451171875, -8.47265625, -7.932861328125, -7.39306640625, -6.853271484375, -6.3134765625, -5.773681640625, -5.23388671875, -4.694091796875, -4.154296875, -3.614501953125, -3.07470703125, -2.534912109375, -1.9951171875, -1.455322265625, -0.91552734375, -0.375732421875, 0.1640625, 0.703857421875, 1.24365234375, 1.783447265625, 2.3232421875, 2.863037109375, 3.40283203125, 3.942626953125, 4.482421875, 5.022216796875, 5.56201171875, 6.101806640625, 6.6416015625, 7.181396484375, 7.72119140625, 8.260986328125, 8.80078125, 9.340576171875, 9.88037109375, 10.420166015625, 10.9599609375, 11.499755859375, 12.03955078125, 12.579345703125, 13.119140625, 13.658935546875, 14.19873046875, 14.738525390625, 15.2783203125, 15.818115234375, 16.35791015625, 16.897705078125, 17.4375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 8.0, 12.0, 13.0, 24.0, 21.0, 39.0, 51.0, 76.0, 148.0, 199.0, 367.0, 813.0, 9278.0, 3110508.0, 22072.0, 1064.0, 379.0, 199.0, 130.0, 94.0, 54.0, 45.0, 19.0, 26.0, 10.0, 14.0, 6.0, 7.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.34375, -55.5283203125, -53.712890625, -51.8974609375, -50.08203125, -48.2666015625, -46.451171875, -44.6357421875, -42.8203125, -41.0048828125, -39.189453125, -37.3740234375, -35.55859375, -33.7431640625, -31.927734375, -30.1123046875, -28.296875, -26.4814453125, -24.666015625, -22.8505859375, -21.03515625, -19.2197265625, -17.404296875, -15.5888671875, -13.7734375, -11.9580078125, -10.142578125, -8.3271484375, -6.51171875, -4.6962890625, -2.880859375, -1.0654296875, 0.75, 2.5654296875, 4.380859375, 6.1962890625, 8.01171875, 9.8271484375, 11.642578125, 13.4580078125, 15.2734375, 17.0888671875, 18.904296875, 20.7197265625, 22.53515625, 24.3505859375, 26.166015625, 27.9814453125, 29.796875, 31.6123046875, 33.427734375, 35.2431640625, 37.05859375, 38.8740234375, 40.689453125, 42.5048828125, 44.3203125, 46.1357421875, 47.951171875, 49.7666015625, 51.58203125, 53.3974609375, 55.212890625, 57.0283203125, 58.84375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 20.0, 40.0, 87.0, 158.0, 187.0, 203.0, 150.0, 92.0, 38.0, 19.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.02022361755371, -18.85841178894043, -17.69659996032715, -16.534788131713867, -15.372976303100586, -14.211164474487305, -13.049351692199707, -11.887539863586426, -10.725728034973145, -9.563916206359863, -8.402104377746582, -7.240292072296143, -6.078480243682861, -4.91666841506958, -3.7548561096191406, -2.5930442810058594, -1.4312324523925781, -0.2694205045700073, 0.8923914432525635, 2.054203510284424, 3.216015338897705, 4.377827167510986, 5.539639472961426, 6.701451301574707, 7.863263130187988, 9.02507495880127, 10.18688678741455, 11.348699569702148, 12.51051139831543, 13.672323226928711, 14.834135055541992, 15.995946884155273, 17.157760620117188, 18.31957244873047, 19.48138427734375, 20.64319610595703, 21.805007934570312, 22.966819763183594, 24.128631591796875, 25.290443420410156, 26.452255249023438, 27.61406707763672, 28.77587890625, 29.93769073486328, 31.099502563476562, 32.261314392089844, 33.423126220703125, 34.584938049316406, 35.74674987792969, 36.90856170654297, 38.07037353515625, 39.23218536376953, 40.39399719238281, 41.555809020996094, 42.717620849609375, 43.879432678222656, 45.0412483215332, 46.203060150146484, 47.364871978759766, 48.52668380737305, 49.68849563598633, 50.85030746459961, 52.01211929321289, 53.17393112182617, 54.33574295043945]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 2.0, 7.0, 10.0, 7.0, 11.0, 18.0, 13.0, 19.0, 15.0, 24.0, 22.0, 26.0, 37.0, 47.0, 28.0, 33.0, 40.0, 37.0, 40.0, 41.0, 35.0, 47.0, 42.0, 36.0, 39.0, 33.0, 34.0, 30.0, 29.0, 22.0, 28.0, 22.0, 21.0, 21.0, 20.0, 13.0, 9.0, 9.0, 11.0, 2.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0], "bins": [-50.722442626953125, -49.169769287109375, -47.617095947265625, -46.064422607421875, -44.511749267578125, -42.959075927734375, -41.406402587890625, -39.853729248046875, -38.301055908203125, -36.748382568359375, -35.195709228515625, -33.643035888671875, -32.090362548828125, -30.537689208984375, -28.985013961791992, -27.432340621948242, -25.87966537475586, -24.32699203491211, -22.77431869506836, -21.22164535522461, -19.66897201538086, -18.11629867553711, -16.563623428344727, -15.010950088500977, -13.458276748657227, -11.905603408813477, -10.352930068969727, -8.80025577545166, -7.24758243560791, -5.69490909576416, -4.142234802246094, -2.5895614624023438, -1.0368881225585938, 0.5157854557037354, 2.0684590339660645, 3.6211328506469727, 5.173806190490723, 6.726479530334473, 8.279153823852539, 9.831827163696289, 11.384500503540039, 12.937173843383789, 14.489847183227539, 16.042522430419922, 17.595195770263672, 19.147869110107422, 20.700542449951172, 22.253215789794922, 23.805889129638672, 25.358562469482422, 26.911235809326172, 28.463909149169922, 30.016582489013672, 31.569255828857422, 33.12193298339844, 34.67460632324219, 36.22727966308594, 37.77995300292969, 39.33262634277344, 40.88529968261719, 42.43797302246094, 43.99064636230469, 45.54331970214844, 47.09599304199219, 48.64866638183594]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 5.0, 5.0, 4.0, 7.0, 9.0, 4.0, 14.0, 29.0, 13.0, 20.0, 29.0, 35.0, 24.0, 43.0, 42.0, 46.0, 38.0, 60.0, 37.0, 55.0, 45.0, 47.0, 49.0, 43.0, 42.0, 30.0, 30.0, 36.0, 27.0, 31.0, 21.0, 17.0, 17.0, 7.0, 9.0, 11.0, 9.0, 6.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-7.04296875, -6.86529541015625, -6.6876220703125, -6.50994873046875, -6.332275390625, -6.15460205078125, -5.9769287109375, -5.79925537109375, -5.62158203125, -5.44390869140625, -5.2662353515625, -5.08856201171875, -4.910888671875, -4.73321533203125, -4.5555419921875, -4.37786865234375, -4.2001953125, -4.02252197265625, -3.8448486328125, -3.66717529296875, -3.489501953125, -3.31182861328125, -3.1341552734375, -2.95648193359375, -2.77880859375, -2.60113525390625, -2.4234619140625, -2.24578857421875, -2.068115234375, -1.89044189453125, -1.7127685546875, -1.53509521484375, -1.357421875, -1.17974853515625, -1.0020751953125, -0.82440185546875, -0.646728515625, -0.46905517578125, -0.2913818359375, -0.11370849609375, 0.06396484375, 0.24163818359375, 0.4193115234375, 0.59698486328125, 0.774658203125, 0.95233154296875, 1.1300048828125, 1.30767822265625, 1.4853515625, 1.66302490234375, 1.8406982421875, 2.01837158203125, 2.196044921875, 2.37371826171875, 2.5513916015625, 2.72906494140625, 2.90673828125, 3.08441162109375, 3.2620849609375, 3.43975830078125, 3.617431640625, 3.79510498046875, 3.9727783203125, 4.15045166015625, 4.328125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 5.0, 16.0, 20.0, 43.0, 38.0, 60.0, 74.0, 160.0, 239.0, 403.0, 883.0, 2469.0, 8697.0, 40676.0, 269411.0, 1614054.0, 1843529.0, 347741.0, 50834.0, 10254.0, 2652.0, 919.0, 435.0, 222.0, 140.0, 87.0, 76.0, 41.0, 34.0, 20.0, 13.0, 9.0, 10.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.390625, -10.0855712890625, -9.780517578125, -9.4754638671875, -9.17041015625, -8.8653564453125, -8.560302734375, -8.2552490234375, -7.9501953125, -7.6451416015625, -7.340087890625, -7.0350341796875, -6.72998046875, -6.4249267578125, -6.119873046875, -5.8148193359375, -5.509765625, -5.2047119140625, -4.899658203125, -4.5946044921875, -4.28955078125, -3.9844970703125, -3.679443359375, -3.3743896484375, -3.0693359375, -2.7642822265625, -2.459228515625, -2.1541748046875, -1.84912109375, -1.5440673828125, -1.239013671875, -0.9339599609375, -0.62890625, -0.3238525390625, -0.018798828125, 0.2862548828125, 0.59130859375, 0.8963623046875, 1.201416015625, 1.5064697265625, 1.8115234375, 2.1165771484375, 2.421630859375, 2.7266845703125, 3.03173828125, 3.3367919921875, 3.641845703125, 3.9468994140625, 4.251953125, 4.5570068359375, 4.862060546875, 5.1671142578125, 5.47216796875, 5.7772216796875, 6.082275390625, 6.3873291015625, 6.6923828125, 6.9974365234375, 7.302490234375, 7.6075439453125, 7.91259765625, 8.2176513671875, 8.522705078125, 8.8277587890625, 9.1328125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 8.0, 11.0, 11.0, 12.0, 22.0, 32.0, 39.0, 39.0, 61.0, 71.0, 95.0, 123.0, 180.0, 223.0, 293.0, 338.0, 355.0, 383.0, 356.0, 296.0, 258.0, 209.0, 144.0, 125.0, 95.0, 63.0, 50.0, 44.0, 28.0, 26.0, 20.0, 9.0, 9.0, 14.0, 6.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.0474853515625, -8.727783203125, -8.4080810546875, -8.08837890625, -7.7686767578125, -7.448974609375, -7.1292724609375, -6.8095703125, -6.4898681640625, -6.170166015625, -5.8504638671875, -5.53076171875, -5.2110595703125, -4.891357421875, -4.5716552734375, -4.251953125, -3.9322509765625, -3.612548828125, -3.2928466796875, -2.97314453125, -2.6534423828125, -2.333740234375, -2.0140380859375, -1.6943359375, -1.3746337890625, -1.054931640625, -0.7352294921875, -0.41552734375, -0.0958251953125, 0.223876953125, 0.5435791015625, 0.86328125, 1.1829833984375, 1.502685546875, 1.8223876953125, 2.14208984375, 2.4617919921875, 2.781494140625, 3.1011962890625, 3.4208984375, 3.7406005859375, 4.060302734375, 4.3800048828125, 4.69970703125, 5.0194091796875, 5.339111328125, 5.6588134765625, 5.978515625, 6.2982177734375, 6.617919921875, 6.9376220703125, 7.25732421875, 7.5770263671875, 7.896728515625, 8.2164306640625, 8.5361328125, 8.8558349609375, 9.175537109375, 9.4952392578125, 9.81494140625, 10.1346435546875, 10.454345703125, 10.7740478515625, 11.09375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 11.0, 11.0, 24.0, 24.0, 19.0, 31.0, 33.0, 53.0, 50.0, 81.0, 90.0, 131.0, 203.0, 306.0, 582.0, 1989.0, 31191.0, 1715032.0, 2396928.0, 43221.0, 2516.0, 626.0, 322.0, 199.0, 155.0, 101.0, 95.0, 49.0, 45.0, 40.0, 24.0, 26.0, 8.0, 12.0, 15.0, 7.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.53125, -30.54736328125, -29.5634765625, -28.57958984375, -27.595703125, -26.61181640625, -25.6279296875, -24.64404296875, -23.66015625, -22.67626953125, -21.6923828125, -20.70849609375, -19.724609375, -18.74072265625, -17.7568359375, -16.77294921875, -15.7890625, -14.80517578125, -13.8212890625, -12.83740234375, -11.853515625, -10.86962890625, -9.8857421875, -8.90185546875, -7.91796875, -6.93408203125, -5.9501953125, -4.96630859375, -3.982421875, -2.99853515625, -2.0146484375, -1.03076171875, -0.046875, 0.93701171875, 1.9208984375, 2.90478515625, 3.888671875, 4.87255859375, 5.8564453125, 6.84033203125, 7.82421875, 8.80810546875, 9.7919921875, 10.77587890625, 11.759765625, 12.74365234375, 13.7275390625, 14.71142578125, 15.6953125, 16.67919921875, 17.6630859375, 18.64697265625, 19.630859375, 20.61474609375, 21.5986328125, 22.58251953125, 23.56640625, 24.55029296875, 25.5341796875, 26.51806640625, 27.501953125, 28.48583984375, 29.4697265625, 30.45361328125, 31.4375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 21.0, 62.0, 127.0, 180.0, 238.0, 201.0, 108.0, 48.0, 14.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.86643981933594, -110.5593490600586, -107.25226593017578, -103.94517517089844, -100.6380844116211, -97.33099365234375, -94.02391052246094, -90.7168197631836, -87.40972900390625, -84.1026382446289, -80.7955551147461, -77.48846435546875, -74.1813735961914, -70.87428283691406, -67.56719970703125, -64.2601089477539, -60.95302200317383, -57.64593505859375, -54.338844299316406, -51.03175735473633, -47.724666595458984, -44.417579650878906, -41.11048889160156, -37.803401947021484, -34.496315002441406, -31.189226150512695, -27.882137298583984, -24.575050354003906, -21.267959594726562, -17.960872650146484, -14.653783798217773, -11.346694946289062, -8.039604187011719, -4.732515335083008, -1.425426959991455, 1.8816614151000977, 5.188750267028809, 8.495838165283203, 11.802927017211914, 15.110015869140625, 18.417104721069336, 21.724193572998047, 25.031282424926758, 28.33837127685547, 31.645458221435547, 34.952545166015625, 38.25963592529297, 41.56672668457031, 44.87381362915039, 48.18090057373047, 51.48799133300781, 54.79507827758789, 58.102169036865234, 61.40925598144531, 64.71634674072266, 68.0234375, 71.33052062988281, 74.63761138916016, 77.94469451904297, 81.25178527832031, 84.55887603759766, 87.865966796875, 91.17304992675781, 94.48014068603516, 97.7872314453125]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 7.0, 3.0, 14.0, 12.0, 19.0, 12.0, 14.0, 15.0, 18.0, 21.0, 20.0, 23.0, 25.0, 27.0, 28.0, 39.0, 36.0, 36.0, 37.0, 33.0, 26.0, 38.0, 38.0, 31.0, 31.0, 37.0, 28.0, 32.0, 31.0, 30.0, 29.0, 36.0, 19.0, 14.0, 20.0, 16.0, 16.0, 12.0, 13.0, 8.0, 8.0, 8.0, 5.0, 2.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-31.427268981933594, -30.416793823242188, -29.406320571899414, -28.39584732055664, -27.385372161865234, -26.374897003173828, -25.364423751831055, -24.35395050048828, -23.343475341796875, -22.33300018310547, -21.322526931762695, -20.312053680419922, -19.301578521728516, -18.29110336303711, -17.280630111694336, -16.270156860351562, -15.259681701660156, -14.249207496643066, -13.238733291625977, -12.228259086608887, -11.217784881591797, -10.207310676574707, -9.196836471557617, -8.186362266540527, -7.1758880615234375, -6.165413856506348, -5.154939651489258, -4.144465446472168, -3.133991241455078, -2.1235170364379883, -1.1130428314208984, -0.1025686264038086, 0.9079055786132812, 1.918379783630371, 2.928853988647461, 3.939328193664551, 4.949802398681641, 5.9602766036987305, 6.97075080871582, 7.98122501373291, 8.99169921875, 10.00217342376709, 11.01264762878418, 12.02312183380127, 13.03359603881836, 14.04407024383545, 15.054544448852539, 16.065017700195312, 17.07549285888672, 18.085968017578125, 19.0964412689209, 20.106914520263672, 21.117389678955078, 22.127864837646484, 23.138338088989258, 24.14881134033203, 25.159286499023438, 26.169761657714844, 27.180234909057617, 28.19070816040039, 29.201183319091797, 30.211658477783203, 31.222131729125977, 32.23260498046875, 33.243080139160156]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 8.0, 6.0, 7.0, 14.0, 19.0, 19.0, 20.0, 20.0, 31.0, 24.0, 33.0, 27.0, 38.0, 35.0, 42.0, 40.0, 22.0, 47.0, 53.0, 48.0, 46.0, 46.0, 32.0, 41.0, 36.0, 35.0, 27.0, 22.0, 28.0, 17.0, 16.0, 15.0, 14.0, 5.0, 12.0, 9.0, 6.0, 7.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-5.58203125, -5.423583984375, -5.26513671875, -5.106689453125, -4.9482421875, -4.789794921875, -4.63134765625, -4.472900390625, -4.314453125, -4.156005859375, -3.99755859375, -3.839111328125, -3.6806640625, -3.522216796875, -3.36376953125, -3.205322265625, -3.046875, -2.888427734375, -2.72998046875, -2.571533203125, -2.4130859375, -2.254638671875, -2.09619140625, -1.937744140625, -1.779296875, -1.620849609375, -1.46240234375, -1.303955078125, -1.1455078125, -0.987060546875, -0.82861328125, -0.670166015625, -0.51171875, -0.353271484375, -0.19482421875, -0.036376953125, 0.1220703125, 0.280517578125, 0.43896484375, 0.597412109375, 0.755859375, 0.914306640625, 1.07275390625, 1.231201171875, 1.3896484375, 1.548095703125, 1.70654296875, 1.864990234375, 2.0234375, 2.181884765625, 2.34033203125, 2.498779296875, 2.6572265625, 2.815673828125, 2.97412109375, 3.132568359375, 3.291015625, 3.449462890625, 3.60791015625, 3.766357421875, 3.9248046875, 4.083251953125, 4.24169921875, 4.400146484375, 4.55859375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 7.0, 5.0, 11.0, 9.0, 14.0, 23.0, 42.0, 57.0, 93.0, 118.0, 186.0, 304.0, 434.0, 668.0, 981.0, 1514.0, 2301.0, 3716.0, 5816.0, 9174.0, 14550.0, 23764.0, 38818.0, 64106.0, 108326.0, 172740.0, 206605.0, 153586.0, 94259.0, 56385.0, 34092.0, 20881.0, 12889.0, 7888.0, 5053.0, 3183.0, 2083.0, 1214.0, 850.0, 604.0, 365.0, 251.0, 183.0, 103.0, 92.0, 58.0, 40.0, 31.0, 30.0, 21.0, 10.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.465576171875, -0.4491615295410156, -0.43274688720703125, -0.4163322448730469, -0.3999176025390625, -0.3835029602050781, -0.36708831787109375, -0.3506736755371094, -0.334259033203125, -0.3178443908691406, -0.30142974853515625, -0.2850151062011719, -0.2686004638671875, -0.2521858215332031, -0.23577117919921875, -0.21935653686523438, -0.20294189453125, -0.18652725219726562, -0.17011260986328125, -0.15369796752929688, -0.1372833251953125, -0.12086868286132812, -0.10445404052734375, -0.08803939819335938, -0.071624755859375, -0.055210113525390625, -0.03879547119140625, -0.022380828857421875, -0.0059661865234375, 0.010448455810546875, 0.02686309814453125, 0.043277740478515625, 0.0596923828125, 0.07610702514648438, 0.09252166748046875, 0.10893630981445312, 0.1253509521484375, 0.14176559448242188, 0.15818023681640625, 0.17459487915039062, 0.191009521484375, 0.20742416381835938, 0.22383880615234375, 0.24025344848632812, 0.2566680908203125, 0.2730827331542969, 0.28949737548828125, 0.3059120178222656, 0.32232666015625, 0.3387413024902344, 0.35515594482421875, 0.3715705871582031, 0.3879852294921875, 0.4043998718261719, 0.42081451416015625, 0.4372291564941406, 0.453643798828125, 0.4700584411621094, 0.48647308349609375, 0.5028877258300781, 0.5193023681640625, 0.5357170104980469, 0.5521316528320312, 0.5685462951660156, 0.5849609375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 1.0, 4.0, 8.0, 6.0, 10.0, 12.0, 19.0, 18.0, 12.0, 14.0, 17.0, 19.0, 28.0, 31.0, 27.0, 33.0, 33.0, 34.0, 44.0, 36.0, 42.0, 35.0, 1051.0, 38.0, 29.0, 42.0, 27.0, 36.0, 40.0, 27.0, 32.0, 25.0, 25.0, 22.0, 24.0, 13.0, 18.0, 9.0, 8.0, 11.0, 5.0, 11.0, 9.0, 3.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.048828125, -2.9586181640625, -2.868408203125, -2.7781982421875, -2.68798828125, -2.5977783203125, -2.507568359375, -2.4173583984375, -2.3271484375, -2.2369384765625, -2.146728515625, -2.0565185546875, -1.96630859375, -1.8760986328125, -1.785888671875, -1.6956787109375, -1.60546875, -1.5152587890625, -1.425048828125, -1.3348388671875, -1.24462890625, -1.1544189453125, -1.064208984375, -0.9739990234375, -0.8837890625, -0.7935791015625, -0.703369140625, -0.6131591796875, -0.52294921875, -0.4327392578125, -0.342529296875, -0.2523193359375, -0.162109375, -0.0718994140625, 0.018310546875, 0.1085205078125, 0.19873046875, 0.2889404296875, 0.379150390625, 0.4693603515625, 0.5595703125, 0.6497802734375, 0.739990234375, 0.8302001953125, 0.92041015625, 1.0106201171875, 1.100830078125, 1.1910400390625, 1.28125, 1.3714599609375, 1.461669921875, 1.5518798828125, 1.64208984375, 1.7322998046875, 1.822509765625, 1.9127197265625, 2.0029296875, 2.0931396484375, 2.183349609375, 2.2735595703125, 2.36376953125, 2.4539794921875, 2.544189453125, 2.6343994140625, 2.724609375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 8.0, 5.0, 10.0, 21.0, 26.0, 39.0, 72.0, 96.0, 149.0, 226.0, 392.0, 596.0, 898.0, 1557.0, 2419.0, 4046.0, 6470.0, 10974.0, 18801.0, 32905.0, 57234.0, 100145.0, 160500.0, 1250996.0, 175967.0, 115314.0, 66711.0, 37681.0, 21650.0, 12277.0, 7381.0, 4411.0, 2591.0, 1672.0, 989.0, 659.0, 433.0, 277.0, 158.0, 135.0, 73.0, 66.0, 40.0, 25.0, 16.0, 14.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42626953125, -0.4127922058105469, -0.39931488037109375, -0.3858375549316406, -0.3723602294921875, -0.3588829040527344, -0.34540557861328125, -0.3319282531738281, -0.318450927734375, -0.3049736022949219, -0.29149627685546875, -0.2780189514160156, -0.2645416259765625, -0.2510643005371094, -0.23758697509765625, -0.22410964965820312, -0.21063232421875, -0.19715499877929688, -0.18367767333984375, -0.17020034790039062, -0.1567230224609375, -0.14324569702148438, -0.12976837158203125, -0.11629104614257812, -0.102813720703125, -0.08933639526367188, -0.07585906982421875, -0.062381744384765625, -0.0489044189453125, -0.035427093505859375, -0.02194976806640625, -0.008472442626953125, 0.0050048828125, 0.018482208251953125, 0.03195953369140625, 0.045436859130859375, 0.0589141845703125, 0.07239151000976562, 0.08586883544921875, 0.09934616088867188, 0.112823486328125, 0.12630081176757812, 0.13977813720703125, 0.15325546264648438, 0.1667327880859375, 0.18021011352539062, 0.19368743896484375, 0.20716476440429688, 0.22064208984375, 0.23411941528320312, 0.24759674072265625, 0.2610740661621094, 0.2745513916015625, 0.2880287170410156, 0.30150604248046875, 0.3149833679199219, 0.328460693359375, 0.3419380187988281, 0.35541534423828125, 0.3688926696777344, 0.3823699951171875, 0.3958473205566406, 0.40932464599609375, 0.4228019714355469, 0.436279296875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 10.0, 8.0, 10.0, 19.0, 19.0, 15.0, 24.0, 29.0, 34.0, 37.0, 40.0, 59.0, 71.0, 71.0, 70.0, 60.0, 70.0, 57.0, 59.0, 44.0, 41.0, 34.0, 30.0, 16.0, 13.0, 12.0, 12.0, 9.0, 8.0, 1.0, 6.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013179779052734375, -0.001270294189453125, -0.0012226104736328125, -0.0011749267578125, -0.0011272430419921875, -0.001079559326171875, -0.0010318756103515625, -0.00098419189453125, -0.0009365081787109375, -0.000888824462890625, -0.0008411407470703125, -0.00079345703125, -0.0007457733154296875, -0.000698089599609375, -0.0006504058837890625, -0.00060272216796875, -0.0005550384521484375, -0.000507354736328125, -0.0004596710205078125, -0.0004119873046875, -0.0003643035888671875, -0.000316619873046875, -0.0002689361572265625, -0.00022125244140625, -0.0001735687255859375, -0.000125885009765625, -7.82012939453125e-05, -3.0517578125e-05, 1.71661376953125e-05, 6.4849853515625e-05, 0.0001125335693359375, 0.00016021728515625, 0.0002079010009765625, 0.000255584716796875, 0.0003032684326171875, 0.0003509521484375, 0.0003986358642578125, 0.000446319580078125, 0.0004940032958984375, 0.00054168701171875, 0.0005893707275390625, 0.000637054443359375, 0.0006847381591796875, 0.000732421875, 0.0007801055908203125, 0.000827789306640625, 0.0008754730224609375, 0.00092315673828125, 0.0009708404541015625, 0.001018524169921875, 0.0010662078857421875, 0.0011138916015625, 0.0011615753173828125, 0.001209259033203125, 0.0012569427490234375, 0.00130462646484375, 0.0013523101806640625, 0.001399993896484375, 0.0014476776123046875, 0.001495361328125, 0.0015430450439453125, 0.001590728759765625, 0.0016384124755859375, 0.00168609619140625, 0.0017337799072265625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 9.0, 9.0, 11.0, 12.0, 24.0, 31.0, 29.0, 48.0, 66.0, 89.0, 140.0, 287.0, 648.0, 4401.0, 991029.0, 49730.0, 1054.0, 346.0, 176.0, 115.0, 66.0, 55.0, 38.0, 25.0, 20.0, 15.0, 18.0, 23.0, 6.0, 4.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0338134765625, -0.03286623954772949, -0.031919002532958984, -0.030971765518188477, -0.03002452850341797, -0.02907729148864746, -0.028130054473876953, -0.027182817459106445, -0.026235580444335938, -0.02528834342956543, -0.024341106414794922, -0.023393869400024414, -0.022446632385253906, -0.0214993953704834, -0.02055215835571289, -0.019604921340942383, -0.018657684326171875, -0.017710447311401367, -0.01676321029663086, -0.01581597328186035, -0.014868736267089844, -0.013921499252319336, -0.012974262237548828, -0.01202702522277832, -0.011079788208007812, -0.010132551193237305, -0.009185314178466797, -0.008238077163696289, -0.007290840148925781, -0.0063436031341552734, -0.005396366119384766, -0.004449129104614258, -0.00350189208984375, -0.002554655075073242, -0.0016074180603027344, -0.0006601810455322266, 0.00028705596923828125, 0.001234292984008789, 0.002181529998779297, 0.0031287670135498047, 0.0040760040283203125, 0.00502324104309082, 0.005970478057861328, 0.006917715072631836, 0.007864952087402344, 0.008812189102172852, 0.00975942611694336, 0.010706663131713867, 0.011653900146484375, 0.012601137161254883, 0.01354837417602539, 0.014495611190795898, 0.015442848205566406, 0.016390085220336914, 0.017337322235107422, 0.01828455924987793, 0.019231796264648438, 0.020179033279418945, 0.021126270294189453, 0.02207350730895996, 0.02302074432373047, 0.023967981338500977, 0.024915218353271484, 0.025862455368041992, 0.0268096923828125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 40.0, 784.0, 188.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014264358207583427, -0.013971385546028614, -0.013678411953151226, -0.013385439291596413, -0.0130924666300416, -0.012799493037164211, -0.012506520375609398, -0.01221354678273201, -0.011920574121177197, -0.011627601459622383, -0.011334627866744995, -0.011041655205190182, -0.010748682543635368, -0.01045570895075798, -0.010162736289203167, -0.009869763627648354, -0.009576790034770966, -0.009283817373216152, -0.008990843780338764, -0.00869787111878395, -0.008404898457229137, -0.00811192486435175, -0.007818952202796936, -0.007525979075580835, -0.007233006879687309, -0.006940033752471209, -0.006647061090916395, -0.0063540879637002945, -0.006061114836484194, -0.005768141709268093, -0.00547516904771328, -0.005182195920497179, -0.004889222327619791, -0.00459624920040369, -0.004303276538848877, -0.004010303411632776, -0.0037173302844166756, -0.0034243573900312185, -0.0031313844956457615, -0.002838411368429661, -0.0025454384740442038, -0.0022524655796587467, -0.001959492452442646, -0.001666519558057189, -0.0013735465472564101, -0.0010805735364556313, -0.0007876006420701742, -0.0004946275148540735, -0.00020165462046861649, 9.131836122833192e-05, 0.00038429134292528033, 0.0006772642955183983, 0.0009702373063191772, 0.001263210317119956, 0.001556183211505413, 0.0018491563387215137, 0.002142129233106971, 0.002435102127492428, 0.0027280752547085285, 0.0030210481490939856, 0.0033140210434794426, 0.0036069941706955433, 0.0038999670650810003, 0.004192939959466457, 0.004485913086682558]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 5.0, 5.0, 4.0, 4.0, 3.0, 6.0, 10.0, 15.0, 13.0, 20.0, 10.0, 22.0, 22.0, 29.0, 27.0, 30.0, 30.0, 27.0, 46.0, 41.0, 46.0, 43.0, 50.0, 44.0, 34.0, 44.0, 43.0, 33.0, 27.0, 27.0, 29.0, 27.0, 30.0, 22.0, 22.0, 19.0, 15.0, 14.0, 7.0, 10.0, 5.0, 10.0, 12.0, 3.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0006848573684692383, -0.0006638104096055031, -0.0006427634507417679, -0.0006217164918780327, -0.0006006695330142975, -0.0005796225741505623, -0.0005585756152868271, -0.0005375286564230919, -0.0005164816975593567, -0.0004954347386956215, -0.0004743877798318863, -0.0004533408209681511, -0.0004322938621044159, -0.0004112469032406807, -0.0003901999443769455, -0.0003691529855132103, -0.0003481060266494751, -0.0003270590677857399, -0.0003060121089220047, -0.0002849651500582695, -0.0002639181911945343, -0.0002428712323307991, -0.0002218242734670639, -0.0002007773146033287, -0.0001797303557395935, -0.0001586833968758583, -0.0001376364380121231, -0.00011658947914838791, -9.554252028465271e-05, -7.449556142091751e-05, -5.344860255718231e-05, -3.240164369344711e-05, -1.1354684829711914e-05, 9.692274034023285e-06, 3.0739232897758484e-05, 5.178619176149368e-05, 7.283315062522888e-05, 9.388010948896408e-05, 0.00011492706835269928, 0.00013597402721643448, 0.00015702098608016968, 0.00017806794494390488, 0.00019911490380764008, 0.00022016186267137527, 0.00024120882153511047, 0.00026225578039884567, 0.00028330273926258087, 0.00030434969812631607, 0.00032539665699005127, 0.00034644361585378647, 0.00036749057471752167, 0.00038853753358125687, 0.00040958449244499207, 0.00043063145130872726, 0.00045167841017246246, 0.00047272536903619766, 0.0004937723278999329, 0.0005148192867636681, 0.0005358662456274033, 0.0005569132044911385, 0.0005779601633548737, 0.0005990071222186089, 0.0006200540810823441, 0.0006411010399460793, 0.0006621479988098145]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 8.0, 6.0, 7.0, 14.0, 19.0, 19.0, 20.0, 20.0, 31.0, 24.0, 33.0, 27.0, 38.0, 35.0, 42.0, 40.0, 22.0, 47.0, 53.0, 48.0, 46.0, 46.0, 33.0, 40.0, 36.0, 35.0, 27.0, 22.0, 28.0, 17.0, 16.0, 15.0, 14.0, 5.0, 12.0, 9.0, 6.0, 7.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-5.58203125, -5.423583984375, -5.26513671875, -5.106689453125, -4.9482421875, -4.789794921875, -4.63134765625, -4.472900390625, -4.314453125, -4.156005859375, -3.99755859375, -3.839111328125, -3.6806640625, -3.522216796875, -3.36376953125, -3.205322265625, -3.046875, -2.888427734375, -2.72998046875, -2.571533203125, -2.4130859375, -2.254638671875, -2.09619140625, -1.937744140625, -1.779296875, -1.620849609375, -1.46240234375, -1.303955078125, -1.1455078125, -0.987060546875, -0.82861328125, -0.670166015625, -0.51171875, -0.353271484375, -0.19482421875, -0.036376953125, 0.1220703125, 0.280517578125, 0.43896484375, 0.597412109375, 0.755859375, 0.914306640625, 1.07275390625, 1.231201171875, 1.3896484375, 1.548095703125, 1.70654296875, 1.864990234375, 2.0234375, 2.181884765625, 2.34033203125, 2.498779296875, 2.6572265625, 2.815673828125, 2.97412109375, 3.132568359375, 3.291015625, 3.449462890625, 3.60791015625, 3.766357421875, 3.9248046875, 4.083251953125, 4.24169921875, 4.400146484375, 4.55859375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 11.0, 12.0, 21.0, 47.0, 66.0, 127.0, 223.0, 446.0, 841.0, 1689.0, 3837.0, 9132.0, 24038.0, 65107.0, 198823.0, 446316.0, 194737.0, 63346.0, 23446.0, 9019.0, 3762.0, 1711.0, 869.0, 442.0, 203.0, 121.0, 64.0, 43.0, 20.0, 6.0, 12.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.57421875, -5.41259765625, -5.2509765625, -5.08935546875, -4.927734375, -4.76611328125, -4.6044921875, -4.44287109375, -4.28125, -4.11962890625, -3.9580078125, -3.79638671875, -3.634765625, -3.47314453125, -3.3115234375, -3.14990234375, -2.98828125, -2.82666015625, -2.6650390625, -2.50341796875, -2.341796875, -2.18017578125, -2.0185546875, -1.85693359375, -1.6953125, -1.53369140625, -1.3720703125, -1.21044921875, -1.048828125, -0.88720703125, -0.7255859375, -0.56396484375, -0.40234375, -0.24072265625, -0.0791015625, 0.08251953125, 0.244140625, 0.40576171875, 0.5673828125, 0.72900390625, 0.890625, 1.05224609375, 1.2138671875, 1.37548828125, 1.537109375, 1.69873046875, 1.8603515625, 2.02197265625, 2.18359375, 2.34521484375, 2.5068359375, 2.66845703125, 2.830078125, 2.99169921875, 3.1533203125, 3.31494140625, 3.4765625, 3.63818359375, 3.7998046875, 3.96142578125, 4.123046875, 4.28466796875, 4.4462890625, 4.60791015625, 4.76953125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 7.0, 11.0, 11.0, 18.0, 21.0, 21.0, 25.0, 37.0, 42.0, 52.0, 58.0, 61.0, 91.0, 245.0, 1743.0, 148.0, 85.0, 63.0, 56.0, 47.0, 43.0, 34.0, 37.0, 20.0, 13.0, 11.0, 14.0, 12.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.453125, -27.57421875, -26.6953125, -25.81640625, -24.9375, -24.05859375, -23.1796875, -22.30078125, -21.421875, -20.54296875, -19.6640625, -18.78515625, -17.90625, -17.02734375, -16.1484375, -15.26953125, -14.390625, -13.51171875, -12.6328125, -11.75390625, -10.875, -9.99609375, -9.1171875, -8.23828125, -7.359375, -6.48046875, -5.6015625, -4.72265625, -3.84375, -2.96484375, -2.0859375, -1.20703125, -0.328125, 0.55078125, 1.4296875, 2.30859375, 3.1875, 4.06640625, 4.9453125, 5.82421875, 6.703125, 7.58203125, 8.4609375, 9.33984375, 10.21875, 11.09765625, 11.9765625, 12.85546875, 13.734375, 14.61328125, 15.4921875, 16.37109375, 17.25, 18.12890625, 19.0078125, 19.88671875, 20.765625, 21.64453125, 22.5234375, 23.40234375, 24.28125, 25.16015625, 26.0390625, 26.91796875, 27.796875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 10.0, 15.0, 17.0, 20.0, 18.0, 27.0, 51.0, 73.0, 108.0, 157.0, 224.0, 322.0, 836.0, 6477.0, 3099538.0, 35060.0, 1429.0, 440.0, 264.0, 185.0, 127.0, 76.0, 50.0, 34.0, 31.0, 22.0, 21.0, 16.0, 11.0, 4.0, 7.0, 2.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.125, -57.197265625, -55.26953125, -53.341796875, -51.4140625, -49.486328125, -47.55859375, -45.630859375, -43.703125, -41.775390625, -39.84765625, -37.919921875, -35.9921875, -34.064453125, -32.13671875, -30.208984375, -28.28125, -26.353515625, -24.42578125, -22.498046875, -20.5703125, -18.642578125, -16.71484375, -14.787109375, -12.859375, -10.931640625, -9.00390625, -7.076171875, -5.1484375, -3.220703125, -1.29296875, 0.634765625, 2.5625, 4.490234375, 6.41796875, 8.345703125, 10.2734375, 12.201171875, 14.12890625, 16.056640625, 17.984375, 19.912109375, 21.83984375, 23.767578125, 25.6953125, 27.623046875, 29.55078125, 31.478515625, 33.40625, 35.333984375, 37.26171875, 39.189453125, 41.1171875, 43.044921875, 44.97265625, 46.900390625, 48.828125, 50.755859375, 52.68359375, 54.611328125, 56.5390625, 58.466796875, 60.39453125, 62.322265625, 64.25]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 12.0, 209.0, 664.0, 127.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.230323791503906, -39.09013366699219, -34.9499397277832, -30.809749603271484, -26.669557571411133, -22.52936553955078, -18.389175415039062, -14.248983383178711, -10.10879135131836, -5.968599796295166, -1.8284082412719727, 2.3117828369140625, 6.451974868774414, 10.592166900634766, 14.732357025146484, 18.872549057006836, 23.012741088867188, 27.15293312072754, 31.29312515258789, 35.43331527709961, 39.573509216308594, 43.71369934082031, 47.85388946533203, 51.99407958984375, 56.134273529052734, 60.27446365356445, 64.41465759277344, 68.55484771728516, 72.69503784179688, 76.83523559570312, 80.97541809082031, 85.11561584472656, 89.25581359863281, 93.39600372314453, 97.53619384765625, 101.6763916015625, 105.81658172607422, 109.95677185058594, 114.09696197509766, 118.23715209960938, 122.37734985351562, 126.51753997802734, 130.65773010253906, 134.7979278564453, 138.9381103515625, 143.07830810546875, 147.218505859375, 151.3586883544922, 155.49887084960938, 159.63906860351562, 163.7792510986328, 167.91944885253906, 172.05963134765625, 176.1998291015625, 180.34002685546875, 184.48020935058594, 188.6204071044922, 192.76060485839844, 196.90078735351562, 201.04098510742188, 205.18116760253906, 209.3213653564453, 213.4615478515625, 217.60174560546875, 221.741943359375]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 2.0, 9.0, 11.0, 8.0, 14.0, 22.0, 16.0, 33.0, 25.0, 27.0, 28.0, 28.0, 34.0, 36.0, 43.0, 43.0, 47.0, 33.0, 46.0, 44.0, 37.0, 31.0, 32.0, 41.0, 34.0, 29.0, 35.0, 26.0, 33.0, 24.0, 13.0, 15.0, 25.0, 7.0, 19.0, 12.0, 6.0, 14.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-51.82158660888672, -50.33015060424805, -48.838714599609375, -47.3472785949707, -45.85584259033203, -44.364402770996094, -42.87297058105469, -41.38153076171875, -39.89009475708008, -38.398658752441406, -36.907222747802734, -35.41578674316406, -33.92435073852539, -32.43291473388672, -30.941476821899414, -29.45003890991211, -27.95860481262207, -26.4671688079834, -24.975732803344727, -23.484294891357422, -21.99285888671875, -20.501422882080078, -19.009986877441406, -17.518550872802734, -16.027114868164062, -14.53567886352539, -13.044241905212402, -11.55280590057373, -10.061368942260742, -8.56993293762207, -7.078496932983398, -5.58705997467041, -4.095623016357422, -2.604186534881592, -1.1127502918243408, 0.37868595123291016, 1.8701224327087402, 3.3615589141845703, 4.852994918823242, 6.3444318771362305, 7.835867881774902, 9.327303886413574, 10.818740844726562, 12.310176849365234, 13.801612854003906, 15.293049812316895, 16.78448486328125, 18.275922775268555, 19.767358779907227, 21.2587947845459, 22.75023078918457, 24.241668701171875, 25.733104705810547, 27.22454071044922, 28.71597671508789, 30.207412719726562, 31.698848724365234, 33.190284729003906, 34.68172073364258, 36.17315673828125, 37.66459274291992, 39.156028747558594, 40.64746856689453, 42.1389045715332, 43.630340576171875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 5.0, 3.0, 6.0, 3.0, 3.0, 6.0, 7.0, 10.0, 10.0, 13.0, 15.0, 11.0, 17.0, 32.0, 26.0, 19.0, 26.0, 34.0, 33.0, 30.0, 27.0, 31.0, 44.0, 42.0, 41.0, 43.0, 36.0, 51.0, 32.0, 38.0, 38.0, 24.0, 32.0, 26.0, 17.0, 40.0, 23.0, 14.0, 14.0, 17.0, 9.0, 11.0, 7.0, 10.0, 8.0, 6.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0], "bins": [-5.05859375, -4.90625, -4.75390625, -4.6015625, -4.44921875, -4.296875, -4.14453125, -3.9921875, -3.83984375, -3.6875, -3.53515625, -3.3828125, -3.23046875, -3.078125, -2.92578125, -2.7734375, -2.62109375, -2.46875, -2.31640625, -2.1640625, -2.01171875, -1.859375, -1.70703125, -1.5546875, -1.40234375, -1.25, -1.09765625, -0.9453125, -0.79296875, -0.640625, -0.48828125, -0.3359375, -0.18359375, -0.03125, 0.12109375, 0.2734375, 0.42578125, 0.578125, 0.73046875, 0.8828125, 1.03515625, 1.1875, 1.33984375, 1.4921875, 1.64453125, 1.796875, 1.94921875, 2.1015625, 2.25390625, 2.40625, 2.55859375, 2.7109375, 2.86328125, 3.015625, 3.16796875, 3.3203125, 3.47265625, 3.625, 3.77734375, 3.9296875, 4.08203125, 4.234375, 4.38671875, 4.5390625, 4.69140625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 6.0, 10.0, 13.0, 12.0, 13.0, 17.0, 18.0, 20.0, 26.0, 28.0, 33.0, 43.0, 61.0, 127.0, 301.0, 1261.0, 9090.0, 251236.0, 3392004.0, 523228.0, 14308.0, 1616.0, 327.0, 129.0, 69.0, 39.0, 30.0, 41.0, 24.0, 17.0, 21.0, 18.0, 17.0, 12.0, 12.0, 4.0, 5.0, 9.0, 5.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 3.0], "bins": [-22.21875, -21.594482421875, -20.97021484375, -20.345947265625, -19.7216796875, -19.097412109375, -18.47314453125, -17.848876953125, -17.224609375, -16.600341796875, -15.97607421875, -15.351806640625, -14.7275390625, -14.103271484375, -13.47900390625, -12.854736328125, -12.23046875, -11.606201171875, -10.98193359375, -10.357666015625, -9.7333984375, -9.109130859375, -8.48486328125, -7.860595703125, -7.236328125, -6.612060546875, -5.98779296875, -5.363525390625, -4.7392578125, -4.114990234375, -3.49072265625, -2.866455078125, -2.2421875, -1.617919921875, -0.99365234375, -0.369384765625, 0.2548828125, 0.879150390625, 1.50341796875, 2.127685546875, 2.751953125, 3.376220703125, 4.00048828125, 4.624755859375, 5.2490234375, 5.873291015625, 6.49755859375, 7.121826171875, 7.74609375, 8.370361328125, 8.99462890625, 9.618896484375, 10.2431640625, 10.867431640625, 11.49169921875, 12.115966796875, 12.740234375, 13.364501953125, 13.98876953125, 14.613037109375, 15.2373046875, 15.861572265625, 16.48583984375, 17.110107421875, 17.734375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 2.0, 4.0, 6.0, 12.0, 10.0, 12.0, 14.0, 22.0, 22.0, 35.0, 39.0, 66.0, 60.0, 89.0, 112.0, 165.0, 190.0, 234.0, 314.0, 332.0, 386.0, 328.0, 351.0, 293.0, 213.0, 170.0, 124.0, 113.0, 79.0, 66.0, 49.0, 46.0, 20.0, 19.0, 28.0, 8.0, 10.0, 7.0, 5.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.8203125, -9.52001953125, -9.2197265625, -8.91943359375, -8.619140625, -8.31884765625, -8.0185546875, -7.71826171875, -7.41796875, -7.11767578125, -6.8173828125, -6.51708984375, -6.216796875, -5.91650390625, -5.6162109375, -5.31591796875, -5.015625, -4.71533203125, -4.4150390625, -4.11474609375, -3.814453125, -3.51416015625, -3.2138671875, -2.91357421875, -2.61328125, -2.31298828125, -2.0126953125, -1.71240234375, -1.412109375, -1.11181640625, -0.8115234375, -0.51123046875, -0.2109375, 0.08935546875, 0.3896484375, 0.68994140625, 0.990234375, 1.29052734375, 1.5908203125, 1.89111328125, 2.19140625, 2.49169921875, 2.7919921875, 3.09228515625, 3.392578125, 3.69287109375, 3.9931640625, 4.29345703125, 4.59375, 4.89404296875, 5.1943359375, 5.49462890625, 5.794921875, 6.09521484375, 6.3955078125, 6.69580078125, 6.99609375, 7.29638671875, 7.5966796875, 7.89697265625, 8.197265625, 8.49755859375, 8.7978515625, 9.09814453125, 9.3984375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 8.0, 6.0, 10.0, 13.0, 21.0, 35.0, 35.0, 49.0, 78.0, 98.0, 184.0, 220.0, 373.0, 1203.0, 16497.0, 2940529.0, 1224989.0, 7964.0, 899.0, 352.0, 183.0, 146.0, 110.0, 69.0, 57.0, 40.0, 27.0, 22.0, 22.0, 11.0, 10.0, 12.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.09375, -45.74462890625, -44.3955078125, -43.04638671875, -41.697265625, -40.34814453125, -38.9990234375, -37.64990234375, -36.30078125, -34.95166015625, -33.6025390625, -32.25341796875, -30.904296875, -29.55517578125, -28.2060546875, -26.85693359375, -25.5078125, -24.15869140625, -22.8095703125, -21.46044921875, -20.111328125, -18.76220703125, -17.4130859375, -16.06396484375, -14.71484375, -13.36572265625, -12.0166015625, -10.66748046875, -9.318359375, -7.96923828125, -6.6201171875, -5.27099609375, -3.921875, -2.57275390625, -1.2236328125, 0.12548828125, 1.474609375, 2.82373046875, 4.1728515625, 5.52197265625, 6.87109375, 8.22021484375, 9.5693359375, 10.91845703125, 12.267578125, 13.61669921875, 14.9658203125, 16.31494140625, 17.6640625, 19.01318359375, 20.3623046875, 21.71142578125, 23.060546875, 24.40966796875, 25.7587890625, 27.10791015625, 28.45703125, 29.80615234375, 31.1552734375, 32.50439453125, 33.853515625, 35.20263671875, 36.5517578125, 37.90087890625, 39.25]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 128.0, 475.0, 359.0, 48.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.47235107421875, -97.2499008178711, -89.02745056152344, -80.80499267578125, -72.5825424194336, -64.36009216308594, -56.137638092041016, -47.915184020996094, -39.69273376464844, -31.47028160095215, -23.24782943725586, -15.02537727355957, -6.802925109863281, 1.419525146484375, 9.641979217529297, 17.86443328857422, 26.086883544921875, 34.30933380126953, 42.53178787231445, 50.754241943359375, 58.97669219970703, 67.19914245605469, 75.42160034179688, 83.64405059814453, 91.86650085449219, 100.08895111083984, 108.3114013671875, 116.53385925292969, 124.75630950927734, 132.978759765625, 141.2012176513672, 149.42367553710938, 157.64614868164062, 165.8686065673828, 174.09104919433594, 182.31350708007812, 190.53594970703125, 198.75840759277344, 206.98086547851562, 215.20330810546875, 223.42576599121094, 231.64822387695312, 239.87066650390625, 248.09312438964844, 256.3155822753906, 264.53802490234375, 272.7604675292969, 280.9829406738281, 289.20538330078125, 297.4278259277344, 305.6502990722656, 313.87274169921875, 322.0951843261719, 330.317626953125, 338.54010009765625, 346.7625427246094, 354.9849853515625, 363.2074279785156, 371.4299011230469, 379.65234375, 387.8747863769531, 396.09722900390625, 404.3197021484375, 412.5421447753906, 420.7646179199219]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 9.0, 6.0, 13.0, 15.0, 14.0, 16.0, 25.0, 20.0, 30.0, 32.0, 34.0, 20.0, 28.0, 28.0, 39.0, 44.0, 41.0, 50.0, 33.0, 43.0, 33.0, 40.0, 33.0, 32.0, 39.0, 34.0, 29.0, 29.0, 31.0, 18.0, 30.0, 19.0, 12.0, 18.0, 12.0, 11.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.222694396972656, -34.116905212402344, -33.01111602783203, -31.90532875061035, -30.79953956604004, -29.693750381469727, -28.587963104248047, -27.482173919677734, -26.376384735107422, -25.27059555053711, -24.164806365966797, -23.059019088745117, -21.953229904174805, -20.847440719604492, -19.741653442382812, -18.6358642578125, -17.530075073242188, -16.424285888671875, -15.318497657775879, -14.212709426879883, -13.10692024230957, -12.001131057739258, -10.895342826843262, -9.789554595947266, -8.683765411376953, -7.577976703643799, -6.4721879959106445, -5.36639928817749, -4.260610580444336, -3.1548218727111816, -2.0490331649780273, -0.943244457244873, 0.16254425048828125, 1.2683329582214355, 2.37412166595459, 3.479910373687744, 4.585699081420898, 5.691487789154053, 6.797276496887207, 7.903065204620361, 9.008853912353516, 10.114643096923828, 11.220431327819824, 12.32621955871582, 13.432008743286133, 14.537797927856445, 15.643586158752441, 16.749374389648438, 17.85516357421875, 18.960952758789062, 20.066741943359375, 21.172529220581055, 22.278318405151367, 23.38410758972168, 24.48989486694336, 25.595684051513672, 26.701473236083984, 27.807262420654297, 28.91305160522461, 30.01883888244629, 31.1246280670166, 32.23041534423828, 33.336204528808594, 34.441993713378906, 35.54778289794922]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 7.0, 12.0, 9.0, 20.0, 13.0, 21.0, 15.0, 28.0, 25.0, 22.0, 23.0, 36.0, 36.0, 41.0, 32.0, 41.0, 40.0, 44.0, 40.0, 40.0, 44.0, 34.0, 31.0, 30.0, 38.0, 32.0, 25.0, 28.0, 25.0, 27.0, 21.0, 19.0, 18.0, 9.0, 10.0, 11.0, 6.0, 9.0, 6.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-5.16796875, -5.01397705078125, -4.8599853515625, -4.70599365234375, -4.552001953125, -4.39801025390625, -4.2440185546875, -4.09002685546875, -3.93603515625, -3.78204345703125, -3.6280517578125, -3.47406005859375, -3.320068359375, -3.16607666015625, -3.0120849609375, -2.85809326171875, -2.7041015625, -2.55010986328125, -2.3961181640625, -2.24212646484375, -2.088134765625, -1.93414306640625, -1.7801513671875, -1.62615966796875, -1.47216796875, -1.31817626953125, -1.1641845703125, -1.01019287109375, -0.856201171875, -0.70220947265625, -0.5482177734375, -0.39422607421875, -0.240234375, -0.08624267578125, 0.0677490234375, 0.22174072265625, 0.375732421875, 0.52972412109375, 0.6837158203125, 0.83770751953125, 0.99169921875, 1.14569091796875, 1.2996826171875, 1.45367431640625, 1.607666015625, 1.76165771484375, 1.9156494140625, 2.06964111328125, 2.2236328125, 2.37762451171875, 2.5316162109375, 2.68560791015625, 2.839599609375, 2.99359130859375, 3.1475830078125, 3.30157470703125, 3.45556640625, 3.60955810546875, 3.7635498046875, 3.91754150390625, 4.071533203125, 4.22552490234375, 4.3795166015625, 4.53350830078125, 4.6875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 16.0, 15.0, 25.0, 38.0, 58.0, 62.0, 96.0, 166.0, 277.0, 400.0, 564.0, 816.0, 1176.0, 1828.0, 2758.0, 4018.0, 5982.0, 9073.0, 13774.0, 21112.0, 33150.0, 52093.0, 83904.0, 132541.0, 181890.0, 173309.0, 120179.0, 75695.0, 47215.0, 29601.0, 19209.0, 12653.0, 8187.0, 5388.0, 3657.0, 2435.0, 1693.0, 1134.0, 787.0, 471.0, 399.0, 216.0, 154.0, 125.0, 68.0, 49.0, 32.0, 14.0, 19.0, 12.0, 11.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.491455078125, -0.4755439758300781, -0.45963287353515625, -0.4437217712402344, -0.4278106689453125, -0.4118995666503906, -0.39598846435546875, -0.3800773620605469, -0.364166259765625, -0.3482551574707031, -0.33234405517578125, -0.3164329528808594, -0.3005218505859375, -0.2846107482910156, -0.26869964599609375, -0.2527885437011719, -0.23687744140625, -0.22096633911132812, -0.20505523681640625, -0.18914413452148438, -0.1732330322265625, -0.15732192993164062, -0.14141082763671875, -0.12549972534179688, -0.109588623046875, -0.09367752075195312, -0.07776641845703125, -0.061855316162109375, -0.0459442138671875, -0.030033111572265625, -0.01412200927734375, 0.001789093017578125, 0.0177001953125, 0.033611297607421875, 0.04952239990234375, 0.06543350219726562, 0.0813446044921875, 0.09725570678710938, 0.11316680908203125, 0.12907791137695312, 0.144989013671875, 0.16090011596679688, 0.17681121826171875, 0.19272232055664062, 0.2086334228515625, 0.22454452514648438, 0.24045562744140625, 0.2563667297363281, 0.27227783203125, 0.2881889343261719, 0.30410003662109375, 0.3200111389160156, 0.3359222412109375, 0.3518333435058594, 0.36774444580078125, 0.3836555480957031, 0.399566650390625, 0.4154777526855469, 0.43138885498046875, 0.4472999572753906, 0.4632110595703125, 0.4791221618652344, 0.49503326416015625, 0.5109443664550781, 0.52685546875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 12.0, 17.0, 16.0, 19.0, 23.0, 20.0, 23.0, 21.0, 26.0, 32.0, 41.0, 32.0, 35.0, 48.0, 51.0, 53.0, 1063.0, 43.0, 51.0, 41.0, 44.0, 20.0, 45.0, 34.0, 38.0, 22.0, 20.0, 21.0, 17.0, 16.0, 17.0, 12.0, 6.0, 11.0, 8.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.453125, -3.344146728515625, -3.23516845703125, -3.126190185546875, -3.0172119140625, -2.908233642578125, -2.79925537109375, -2.690277099609375, -2.581298828125, -2.472320556640625, -2.36334228515625, -2.254364013671875, -2.1453857421875, -2.036407470703125, -1.92742919921875, -1.818450927734375, -1.70947265625, -1.600494384765625, -1.49151611328125, -1.382537841796875, -1.2735595703125, -1.164581298828125, -1.05560302734375, -0.946624755859375, -0.837646484375, -0.728668212890625, -0.61968994140625, -0.510711669921875, -0.4017333984375, -0.292755126953125, -0.18377685546875, -0.074798583984375, 0.0341796875, 0.143157958984375, 0.25213623046875, 0.361114501953125, 0.4700927734375, 0.579071044921875, 0.68804931640625, 0.797027587890625, 0.906005859375, 1.014984130859375, 1.12396240234375, 1.232940673828125, 1.3419189453125, 1.450897216796875, 1.55987548828125, 1.668853759765625, 1.77783203125, 1.886810302734375, 1.99578857421875, 2.104766845703125, 2.2137451171875, 2.322723388671875, 2.43170166015625, 2.540679931640625, 2.649658203125, 2.758636474609375, 2.86761474609375, 2.976593017578125, 3.0855712890625, 3.194549560546875, 3.30352783203125, 3.412506103515625, 3.521484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 14.0, 18.0, 17.0, 40.0, 48.0, 102.0, 132.0, 229.0, 363.0, 586.0, 939.0, 1574.0, 2737.0, 4522.0, 8306.0, 14920.0, 27737.0, 51879.0, 98144.0, 171215.0, 1274580.0, 190162.0, 115288.0, 61453.0, 32133.0, 17371.0, 9712.0, 5328.0, 3112.0, 1782.0, 1014.0, 608.0, 386.0, 229.0, 167.0, 106.0, 53.0, 42.0, 32.0, 18.0, 15.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54638671875, -0.530609130859375, -0.51483154296875, -0.499053955078125, -0.4832763671875, -0.467498779296875, -0.45172119140625, -0.435943603515625, -0.420166015625, -0.404388427734375, -0.38861083984375, -0.372833251953125, -0.3570556640625, -0.341278076171875, -0.32550048828125, -0.309722900390625, -0.2939453125, -0.278167724609375, -0.26239013671875, -0.246612548828125, -0.2308349609375, -0.215057373046875, -0.19927978515625, -0.183502197265625, -0.167724609375, -0.151947021484375, -0.13616943359375, -0.120391845703125, -0.1046142578125, -0.088836669921875, -0.07305908203125, -0.057281494140625, -0.04150390625, -0.025726318359375, -0.00994873046875, 0.005828857421875, 0.0216064453125, 0.037384033203125, 0.05316162109375, 0.068939208984375, 0.084716796875, 0.100494384765625, 0.11627197265625, 0.132049560546875, 0.1478271484375, 0.163604736328125, 0.17938232421875, 0.195159912109375, 0.2109375, 0.226715087890625, 0.24249267578125, 0.258270263671875, 0.2740478515625, 0.289825439453125, 0.30560302734375, 0.321380615234375, 0.337158203125, 0.352935791015625, 0.36871337890625, 0.384490966796875, 0.4002685546875, 0.416046142578125, 0.43182373046875, 0.447601318359375, 0.46337890625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 8.0, 6.0, 6.0, 8.0, 9.0, 14.0, 18.0, 27.0, 24.0, 25.0, 32.0, 23.0, 44.0, 39.0, 42.0, 61.0, 51.0, 38.0, 44.0, 52.0, 47.0, 50.0, 38.0, 30.0, 41.0, 38.0, 26.0, 26.0, 24.0, 26.0, 12.0, 17.0, 3.0, 14.0, 8.0, 6.0, 6.0, 4.0, 7.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0009899139404296875, -0.0009552240371704102, -0.0009205341339111328, -0.0008858442306518555, -0.0008511543273925781, -0.0008164644241333008, -0.0007817745208740234, -0.0007470846176147461, -0.0007123947143554688, -0.0006777048110961914, -0.0006430149078369141, -0.0006083250045776367, -0.0005736351013183594, -0.000538945198059082, -0.0005042552947998047, -0.00046956539154052734, -0.00043487548828125, -0.00040018558502197266, -0.0003654956817626953, -0.00033080577850341797, -0.0002961158752441406, -0.0002614259719848633, -0.00022673606872558594, -0.0001920461654663086, -0.00015735626220703125, -0.0001226663589477539, -8.797645568847656e-05, -5.328655242919922e-05, -1.8596649169921875e-05, 1.609325408935547e-05, 5.078315734863281e-05, 8.547306060791016e-05, 0.0001201629638671875, 0.00015485286712646484, 0.0001895427703857422, 0.00022423267364501953, 0.0002589225769042969, 0.0002936124801635742, 0.00032830238342285156, 0.0003629922866821289, 0.00039768218994140625, 0.0004323720932006836, 0.00046706199645996094, 0.0005017518997192383, 0.0005364418029785156, 0.000571131706237793, 0.0006058216094970703, 0.0006405115127563477, 0.000675201416015625, 0.0007098913192749023, 0.0007445812225341797, 0.000779271125793457, 0.0008139610290527344, 0.0008486509323120117, 0.0008833408355712891, 0.0009180307388305664, 0.0009527206420898438, 0.000987410545349121, 0.0010221004486083984, 0.0010567903518676758, 0.0010914802551269531, 0.0011261701583862305, 0.0011608600616455078, 0.0011955499649047852, 0.0012302398681640625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 6.0, 7.0, 16.0, 13.0, 13.0, 23.0, 19.0, 25.0, 41.0, 49.0, 56.0, 75.0, 107.0, 162.0, 296.0, 733.0, 4219.0, 798189.0, 241150.0, 1930.0, 582.0, 275.0, 136.0, 94.0, 60.0, 63.0, 35.0, 47.0, 21.0, 24.0, 18.0, 11.0, 14.0, 11.0, 10.0, 0.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0264129638671875, -0.025676250457763672, -0.024939537048339844, -0.024202823638916016, -0.023466110229492188, -0.02272939682006836, -0.02199268341064453, -0.021255970001220703, -0.020519256591796875, -0.019782543182373047, -0.01904582977294922, -0.01830911636352539, -0.017572402954101562, -0.016835689544677734, -0.016098976135253906, -0.015362262725830078, -0.01462554931640625, -0.013888835906982422, -0.013152122497558594, -0.012415409088134766, -0.011678695678710938, -0.01094198226928711, -0.010205268859863281, -0.009468555450439453, -0.008731842041015625, -0.007995128631591797, -0.007258415222167969, -0.006521701812744141, -0.0057849884033203125, -0.005048274993896484, -0.004311561584472656, -0.003574848175048828, -0.002838134765625, -0.002101421356201172, -0.0013647079467773438, -0.0006279945373535156, 0.0001087188720703125, 0.0008454322814941406, 0.0015821456909179688, 0.002318859100341797, 0.003055572509765625, 0.003792285919189453, 0.004528999328613281, 0.005265712738037109, 0.0060024261474609375, 0.006739139556884766, 0.007475852966308594, 0.008212566375732422, 0.00894927978515625, 0.009685993194580078, 0.010422706604003906, 0.011159420013427734, 0.011896133422851562, 0.01263284683227539, 0.013369560241699219, 0.014106273651123047, 0.014842987060546875, 0.015579700469970703, 0.01631641387939453, 0.01705312728881836, 0.017789840698242188, 0.018526554107666016, 0.019263267517089844, 0.019999980926513672, 0.0207366943359375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 13.0, 23.0, 60.0, 124.0, 146.0, 195.0, 172.0, 128.0, 84.0, 27.0, 15.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001208073110319674, -0.0011610151268541813, -0.0011139571433886886, -0.0010668991599231958, -0.0010198410600423813, -0.0009727830765768886, -0.0009257250931113958, -0.0008786671096459031, -0.0008316090679727495, -0.0007845510845072567, -0.0007374930428341031, -0.0006904350593686104, -0.0006433770759031177, -0.000596319034229964, -0.0005492610507644713, -0.0005022030090913177, -0.00045514502562582493, -0.00040808701305650175, -0.00036102900048717856, -0.00031397101702168584, -0.00026691300445236266, -0.00021985499188303947, -0.00017279700841754675, -0.00012573899584822357, -7.868098327890038e-05, -3.162297798553482e-05, 1.543502730783075e-05, 6.24930253252387e-05, 0.00010955103789456189, 0.00015660905046388507, 0.0002036670339293778, 0.000250725046498701, 0.000297783175483346, 0.00034484118805266917, 0.00039189920062199235, 0.0004389571840874851, 0.00048601519665680826, 0.0005330732092261314, 0.0005801311926916242, 0.0006271891761571169, 0.0006742472178302705, 0.0007213052012957633, 0.0007683632429689169, 0.0008154212264344096, 0.0008624792098999023, 0.000909537251573056, 0.0009565952350385487, 0.0010036532767117023, 0.001050711260177195, 0.0010977692436426878, 0.0011448272271081805, 0.0011918852105736732, 0.0012389433104544878, 0.0012860012939199805, 0.0013330592773854733, 0.001380117260850966, 0.0014271752443164587, 0.0014742332277819514, 0.0015212912112474442, 0.0015683493111282587, 0.0016154072945937514, 0.0016624652780592442, 0.0017095232615247369, 0.0017565812449902296, 0.0018036393448710442]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 4.0, 5.0, 3.0, 12.0, 13.0, 11.0, 23.0, 18.0, 29.0, 22.0, 30.0, 30.0, 28.0, 31.0, 47.0, 38.0, 50.0, 41.0, 37.0, 35.0, 37.0, 35.0, 37.0, 35.0, 46.0, 27.0, 35.0, 33.0, 35.0, 24.0, 21.0, 20.0, 13.0, 18.0, 9.0, 17.0, 15.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000590980052947998, -0.0005714157596230507, -0.0005518514662981033, -0.000532287172973156, -0.0005127228796482086, -0.0004931585863232613, -0.0004735942929983139, -0.00045402999967336655, -0.0004344657063484192, -0.00041490141302347183, -0.0003953371196985245, -0.0003757728263735771, -0.00035620853304862976, -0.0003366442397236824, -0.00031707994639873505, -0.0002975156530737877, -0.00027795135974884033, -0.000258387066423893, -0.00023882277309894562, -0.00021925847977399826, -0.0001996941864490509, -0.00018012989312410355, -0.0001605655997991562, -0.00014100130647420883, -0.00012143701314926147, -0.00010187271982431412, -8.230842649936676e-05, -6.27441331744194e-05, -4.3179839849472046e-05, -2.361554652452469e-05, -4.0512531995773315e-06, 1.5513040125370026e-05, 3.507733345031738e-05, 5.464162677526474e-05, 7.42059201002121e-05, 9.377021342515945e-05, 0.00011333450675010681, 0.00013289880007505417, 0.00015246309340000153, 0.00017202738672494888, 0.00019159168004989624, 0.0002111559733748436, 0.00023072026669979095, 0.0002502845600247383, 0.00026984885334968567, 0.000289413146674633, 0.0003089774399995804, 0.00032854173332452774, 0.0003481060266494751, 0.00036767031997442245, 0.0003872346132993698, 0.00040679890662431717, 0.0004263631999492645, 0.0004459274932742119, 0.00046549178659915924, 0.0004850560799241066, 0.000504620373249054, 0.0005241846665740013, 0.0005437489598989487, 0.000563313253223896, 0.0005828775465488434, 0.0006024418398737907, 0.0006220061331987381, 0.0006415704265236855, 0.0006611347198486328]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 7.0, 12.0, 9.0, 20.0, 13.0, 21.0, 15.0, 28.0, 25.0, 22.0, 23.0, 36.0, 36.0, 41.0, 32.0, 41.0, 40.0, 44.0, 40.0, 40.0, 44.0, 34.0, 31.0, 30.0, 38.0, 32.0, 25.0, 28.0, 25.0, 27.0, 21.0, 19.0, 18.0, 9.0, 10.0, 11.0, 6.0, 9.0, 6.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-5.16796875, -5.01397705078125, -4.8599853515625, -4.70599365234375, -4.552001953125, -4.39801025390625, -4.2440185546875, -4.09002685546875, -3.93603515625, -3.78204345703125, -3.6280517578125, -3.47406005859375, -3.320068359375, -3.16607666015625, -3.0120849609375, -2.85809326171875, -2.7041015625, -2.55010986328125, -2.3961181640625, -2.24212646484375, -2.088134765625, -1.93414306640625, -1.7801513671875, -1.62615966796875, -1.47216796875, -1.31817626953125, -1.1641845703125, -1.01019287109375, -0.856201171875, -0.70220947265625, -0.5482177734375, -0.39422607421875, -0.240234375, -0.08624267578125, 0.0677490234375, 0.22174072265625, 0.375732421875, 0.52972412109375, 0.6837158203125, 0.83770751953125, 0.99169921875, 1.14569091796875, 1.2996826171875, 1.45367431640625, 1.607666015625, 1.76165771484375, 1.9156494140625, 2.06964111328125, 2.2236328125, 2.37762451171875, 2.5316162109375, 2.68560791015625, 2.839599609375, 2.99359130859375, 3.1475830078125, 3.30157470703125, 3.45556640625, 3.60955810546875, 3.7635498046875, 3.91754150390625, 4.071533203125, 4.22552490234375, 4.3795166015625, 4.53350830078125, 4.6875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 6.0, 16.0, 24.0, 30.0, 43.0, 56.0, 102.0, 148.0, 201.0, 320.0, 543.0, 909.0, 1535.0, 2619.0, 4830.0, 9181.0, 17613.0, 34573.0, 71833.0, 156811.0, 348403.0, 212714.0, 93598.0, 44808.0, 22052.0, 11497.0, 6004.0, 3341.0, 1827.0, 1061.0, 646.0, 416.0, 290.0, 146.0, 98.0, 77.0, 44.0, 38.0, 29.0, 21.0, 9.0, 11.0, 5.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.00390625, -3.881378173828125, -3.75885009765625, -3.636322021484375, -3.5137939453125, -3.391265869140625, -3.26873779296875, -3.146209716796875, -3.023681640625, -2.901153564453125, -2.77862548828125, -2.656097412109375, -2.5335693359375, -2.411041259765625, -2.28851318359375, -2.165985107421875, -2.04345703125, -1.920928955078125, -1.79840087890625, -1.675872802734375, -1.5533447265625, -1.430816650390625, -1.30828857421875, -1.185760498046875, -1.063232421875, -0.940704345703125, -0.81817626953125, -0.695648193359375, -0.5731201171875, -0.450592041015625, -0.32806396484375, -0.205535888671875, -0.0830078125, 0.039520263671875, 0.16204833984375, 0.284576416015625, 0.4071044921875, 0.529632568359375, 0.65216064453125, 0.774688720703125, 0.897216796875, 1.019744873046875, 1.14227294921875, 1.264801025390625, 1.3873291015625, 1.509857177734375, 1.63238525390625, 1.754913330078125, 1.87744140625, 1.999969482421875, 2.12249755859375, 2.245025634765625, 2.3675537109375, 2.490081787109375, 2.61260986328125, 2.735137939453125, 2.857666015625, 2.980194091796875, 3.10272216796875, 3.225250244140625, 3.3477783203125, 3.470306396484375, 3.59283447265625, 3.715362548828125, 3.837890625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 5.0, 3.0, 7.0, 13.0, 7.0, 13.0, 18.0, 22.0, 19.0, 23.0, 33.0, 28.0, 38.0, 40.0, 33.0, 54.0, 47.0, 68.0, 106.0, 292.0, 1524.0, 162.0, 93.0, 61.0, 45.0, 40.0, 35.0, 32.0, 21.0, 25.0, 22.0, 18.0, 25.0, 15.0, 14.0, 14.0, 9.0, 10.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-19.5625, -18.990478515625, -18.41845703125, -17.846435546875, -17.2744140625, -16.702392578125, -16.13037109375, -15.558349609375, -14.986328125, -14.414306640625, -13.84228515625, -13.270263671875, -12.6982421875, -12.126220703125, -11.55419921875, -10.982177734375, -10.41015625, -9.838134765625, -9.26611328125, -8.694091796875, -8.1220703125, -7.550048828125, -6.97802734375, -6.406005859375, -5.833984375, -5.261962890625, -4.68994140625, -4.117919921875, -3.5458984375, -2.973876953125, -2.40185546875, -1.829833984375, -1.2578125, -0.685791015625, -0.11376953125, 0.458251953125, 1.0302734375, 1.602294921875, 2.17431640625, 2.746337890625, 3.318359375, 3.890380859375, 4.46240234375, 5.034423828125, 5.6064453125, 6.178466796875, 6.75048828125, 7.322509765625, 7.89453125, 8.466552734375, 9.03857421875, 9.610595703125, 10.1826171875, 10.754638671875, 11.32666015625, 11.898681640625, 12.470703125, 13.042724609375, 13.61474609375, 14.186767578125, 14.7587890625, 15.330810546875, 15.90283203125, 16.474853515625, 17.046875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 1.0, 1.0, 6.0, 9.0, 22.0, 42.0, 58.0, 68.0, 116.0, 192.0, 341.0, 743.0, 11755.0, 3127015.0, 3925.0, 627.0, 297.0, 175.0, 106.0, 69.0, 64.0, 25.0, 19.0, 16.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.75, -70.275390625, -67.80078125, -65.326171875, -62.8515625, -60.376953125, -57.90234375, -55.427734375, -52.953125, -50.478515625, -48.00390625, -45.529296875, -43.0546875, -40.580078125, -38.10546875, -35.630859375, -33.15625, -30.681640625, -28.20703125, -25.732421875, -23.2578125, -20.783203125, -18.30859375, -15.833984375, -13.359375, -10.884765625, -8.41015625, -5.935546875, -3.4609375, -0.986328125, 1.48828125, 3.962890625, 6.4375, 8.912109375, 11.38671875, 13.861328125, 16.3359375, 18.810546875, 21.28515625, 23.759765625, 26.234375, 28.708984375, 31.18359375, 33.658203125, 36.1328125, 38.607421875, 41.08203125, 43.556640625, 46.03125, 48.505859375, 50.98046875, 53.455078125, 55.9296875, 58.404296875, 60.87890625, 63.353515625, 65.828125, 68.302734375, 70.77734375, 73.251953125, 75.7265625, 78.201171875, 80.67578125, 83.150390625, 85.625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 12.0, 152.0, 398.0, 355.0, 80.0, 16.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.663169860839844, -44.051605224609375, -41.440040588378906, -38.82847595214844, -36.21691131591797, -33.6053466796875, -30.993785858154297, -28.382221221923828, -25.77065658569336, -23.15909194946289, -20.547527313232422, -17.935964584350586, -15.324399948120117, -12.712835311889648, -10.101271629333496, -7.489707946777344, -4.878143310546875, -2.2665791511535645, 0.3449850082397461, 2.9565491676330566, 5.568113327026367, 8.179677963256836, 10.791241645812988, 13.40280532836914, 16.01436996459961, 18.625934600830078, 21.237499237060547, 23.849061965942383, 26.46062660217285, 29.07219123840332, 31.683753967285156, 34.295318603515625, 36.90687561035156, 39.51844024658203, 42.1300048828125, 44.74156951904297, 47.35313415527344, 49.964698791503906, 52.57625961303711, 55.18782424926758, 57.79938888549805, 60.410953521728516, 63.022518157958984, 65.63407897949219, 68.24564361572266, 70.85720825195312, 73.4687728881836, 76.08033752441406, 78.69190216064453, 81.303466796875, 83.91503143310547, 86.52659606933594, 89.1381607055664, 91.74972534179688, 94.36128997802734, 96.97285461425781, 99.58441162109375, 102.19597625732422, 104.80754089355469, 107.41910552978516, 110.03067016601562, 112.6422348022461, 115.25379943847656, 117.8653564453125, 120.4769287109375]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 11.0, 4.0, 6.0, 12.0, 17.0, 17.0, 38.0, 34.0, 36.0, 23.0, 38.0, 41.0, 52.0, 41.0, 49.0, 53.0, 43.0, 33.0, 39.0, 50.0, 44.0, 55.0, 37.0, 28.0, 33.0, 28.0, 30.0, 15.0, 19.0, 12.0, 13.0, 4.0, 15.0, 10.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.79033660888672, -60.953773498535156, -59.11720657348633, -57.280643463134766, -55.4440803527832, -53.607513427734375, -51.77095031738281, -49.93438720703125, -48.09782409667969, -46.261260986328125, -44.4246940612793, -42.588130950927734, -40.75156784057617, -38.915000915527344, -37.07843780517578, -35.24187469482422, -33.405311584472656, -31.56874656677246, -29.7321834564209, -27.895618438720703, -26.05905532836914, -24.222490310668945, -22.38592529296875, -20.549362182617188, -18.71279525756836, -16.876230239868164, -15.039667129516602, -13.203102111816406, -11.366539001464844, -9.529973983764648, -7.6934099197387695, -5.856845855712891, -4.020282745361328, -2.183718681335449, -0.3471543788909912, 1.4894099235534668, 3.3259739875793457, 5.162538528442383, 6.999102592468262, 8.83566665649414, 10.67223072052002, 12.508794784545898, 14.345358848571777, 16.181922912597656, 18.01848793029785, 19.855052947998047, 21.69161605834961, 23.528179168701172, 25.364744186401367, 27.201309204101562, 29.037872314453125, 30.87443733215332, 32.711002349853516, 34.54756546020508, 36.38412857055664, 38.22069549560547, 40.05725860595703, 41.893821716308594, 43.73038864135742, 45.566951751708984, 47.40351486206055, 49.240081787109375, 51.07664489746094, 52.9132080078125, 54.74977111816406]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 14.0, 7.0, 8.0, 11.0, 18.0, 18.0, 15.0, 19.0, 28.0, 26.0, 28.0, 35.0, 44.0, 36.0, 28.0, 31.0, 40.0, 48.0, 37.0, 41.0, 45.0, 39.0, 35.0, 33.0, 32.0, 25.0, 40.0, 28.0, 26.0, 26.0, 18.0, 19.0, 20.0, 12.0, 10.0, 7.0, 10.0, 6.0, 6.0, 4.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.3359375, -5.1685791015625, -5.001220703125, -4.8338623046875, -4.66650390625, -4.4991455078125, -4.331787109375, -4.1644287109375, -3.9970703125, -3.8297119140625, -3.662353515625, -3.4949951171875, -3.32763671875, -3.1602783203125, -2.992919921875, -2.8255615234375, -2.658203125, -2.4908447265625, -2.323486328125, -2.1561279296875, -1.98876953125, -1.8214111328125, -1.654052734375, -1.4866943359375, -1.3193359375, -1.1519775390625, -0.984619140625, -0.8172607421875, -0.64990234375, -0.4825439453125, -0.315185546875, -0.1478271484375, 0.01953125, 0.1868896484375, 0.354248046875, 0.5216064453125, 0.68896484375, 0.8563232421875, 1.023681640625, 1.1910400390625, 1.3583984375, 1.5257568359375, 1.693115234375, 1.8604736328125, 2.02783203125, 2.1951904296875, 2.362548828125, 2.5299072265625, 2.697265625, 2.8646240234375, 3.031982421875, 3.1993408203125, 3.36669921875, 3.5340576171875, 3.701416015625, 3.8687744140625, 4.0361328125, 4.2034912109375, 4.370849609375, 4.5382080078125, 4.70556640625, 4.8729248046875, 5.040283203125, 5.2076416015625, 5.375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 6.0, 10.0, 12.0, 9.0, 16.0, 20.0, 19.0, 24.0, 33.0, 25.0, 49.0, 78.0, 149.0, 344.0, 1195.0, 6902.0, 114360.0, 2591100.0, 1431799.0, 43076.0, 3619.0, 769.0, 250.0, 116.0, 56.0, 36.0, 34.0, 23.0, 26.0, 21.0, 14.0, 19.0, 14.0, 8.0, 10.0, 3.0, 5.0, 7.0, 2.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.328125, -18.721435546875, -18.11474609375, -17.508056640625, -16.9013671875, -16.294677734375, -15.68798828125, -15.081298828125, -14.474609375, -13.867919921875, -13.26123046875, -12.654541015625, -12.0478515625, -11.441162109375, -10.83447265625, -10.227783203125, -9.62109375, -9.014404296875, -8.40771484375, -7.801025390625, -7.1943359375, -6.587646484375, -5.98095703125, -5.374267578125, -4.767578125, -4.160888671875, -3.55419921875, -2.947509765625, -2.3408203125, -1.734130859375, -1.12744140625, -0.520751953125, 0.0859375, 0.692626953125, 1.29931640625, 1.906005859375, 2.5126953125, 3.119384765625, 3.72607421875, 4.332763671875, 4.939453125, 5.546142578125, 6.15283203125, 6.759521484375, 7.3662109375, 7.972900390625, 8.57958984375, 9.186279296875, 9.79296875, 10.399658203125, 11.00634765625, 11.613037109375, 12.2197265625, 12.826416015625, 13.43310546875, 14.039794921875, 14.646484375, 15.253173828125, 15.85986328125, 16.466552734375, 17.0732421875, 17.679931640625, 18.28662109375, 18.893310546875, 19.5]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 9.0, 15.0, 20.0, 13.0, 24.0, 33.0, 43.0, 55.0, 87.0, 90.0, 140.0, 179.0, 229.0, 276.0, 367.0, 387.0, 379.0, 381.0, 304.0, 237.0, 174.0, 156.0, 94.0, 95.0, 59.0, 54.0, 40.0, 34.0, 30.0, 16.0, 14.0, 9.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.296875, -9.966064453125, -9.63525390625, -9.304443359375, -8.9736328125, -8.642822265625, -8.31201171875, -7.981201171875, -7.650390625, -7.319580078125, -6.98876953125, -6.657958984375, -6.3271484375, -5.996337890625, -5.66552734375, -5.334716796875, -5.00390625, -4.673095703125, -4.34228515625, -4.011474609375, -3.6806640625, -3.349853515625, -3.01904296875, -2.688232421875, -2.357421875, -2.026611328125, -1.69580078125, -1.364990234375, -1.0341796875, -0.703369140625, -0.37255859375, -0.041748046875, 0.2890625, 0.619873046875, 0.95068359375, 1.281494140625, 1.6123046875, 1.943115234375, 2.27392578125, 2.604736328125, 2.935546875, 3.266357421875, 3.59716796875, 3.927978515625, 4.2587890625, 4.589599609375, 4.92041015625, 5.251220703125, 5.58203125, 5.912841796875, 6.24365234375, 6.574462890625, 6.9052734375, 7.236083984375, 7.56689453125, 7.897705078125, 8.228515625, 8.559326171875, 8.89013671875, 9.220947265625, 9.5517578125, 9.882568359375, 10.21337890625, 10.544189453125, 10.875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 0.0, 5.0, 6.0, 4.0, 6.0, 4.0, 11.0, 19.0, 17.0, 34.0, 43.0, 43.0, 53.0, 69.0, 101.0, 103.0, 155.0, 171.0, 232.0, 299.0, 579.0, 2046.0, 45833.0, 3377302.0, 754412.0, 10101.0, 1034.0, 398.0, 268.0, 214.0, 123.0, 110.0, 100.0, 90.0, 58.0, 45.0, 47.0, 38.0, 27.0, 15.0, 12.0, 17.0, 10.0, 13.0, 8.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-38.75, -37.603515625, -36.45703125, -35.310546875, -34.1640625, -33.017578125, -31.87109375, -30.724609375, -29.578125, -28.431640625, -27.28515625, -26.138671875, -24.9921875, -23.845703125, -22.69921875, -21.552734375, -20.40625, -19.259765625, -18.11328125, -16.966796875, -15.8203125, -14.673828125, -13.52734375, -12.380859375, -11.234375, -10.087890625, -8.94140625, -7.794921875, -6.6484375, -5.501953125, -4.35546875, -3.208984375, -2.0625, -0.916015625, 0.23046875, 1.376953125, 2.5234375, 3.669921875, 4.81640625, 5.962890625, 7.109375, 8.255859375, 9.40234375, 10.548828125, 11.6953125, 12.841796875, 13.98828125, 15.134765625, 16.28125, 17.427734375, 18.57421875, 19.720703125, 20.8671875, 22.013671875, 23.16015625, 24.306640625, 25.453125, 26.599609375, 27.74609375, 28.892578125, 30.0390625, 31.185546875, 32.33203125, 33.478515625, 34.625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 17.0, 182.0, 455.0, 311.0, 48.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-266.1879577636719, -259.6512145996094, -253.11444091796875, -246.57769775390625, -240.0409393310547, -233.50418090820312, -226.96742248535156, -220.4306640625, -213.8939208984375, -207.35716247558594, -200.82040405273438, -194.28366088867188, -187.7469024658203, -181.21014404296875, -174.6733856201172, -168.13662719726562, -161.59986877441406, -155.0631103515625, -148.52635192871094, -141.98959350585938, -135.45285034179688, -128.9160919189453, -122.37933349609375, -115.84257507324219, -109.30582427978516, -102.7690658569336, -96.23231506347656, -89.695556640625, -83.15879821777344, -76.6220474243164, -70.08528900146484, -63.54853439331055, -57.01176452636719, -50.47500991821289, -43.938255310058594, -37.40149688720703, -30.864742279052734, -24.327987670898438, -17.791229248046875, -11.254474639892578, -4.717720031738281, 1.819035530090332, 8.355791091918945, 14.892547607421875, 21.429302215576172, 27.96605682373047, 34.50281524658203, 41.03956985473633, 47.576324462890625, 54.11307907104492, 60.64983367919922, 67.18659210205078, 73.72334289550781, 80.26010131835938, 86.79685974121094, 93.3336181640625, 99.87036895751953, 106.4071273803711, 112.94387817382812, 119.48063659667969, 126.01739501953125, 132.55413818359375, 139.09091186523438, 145.62765502929688, 152.16441345214844]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 4.0, 11.0, 2.0, 9.0, 12.0, 11.0, 14.0, 20.0, 23.0, 15.0, 24.0, 33.0, 35.0, 32.0, 35.0, 36.0, 33.0, 37.0, 35.0, 33.0, 33.0, 38.0, 49.0, 29.0, 40.0, 30.0, 30.0, 42.0, 33.0, 27.0, 32.0, 23.0, 19.0, 16.0, 16.0, 17.0, 21.0, 10.0, 10.0, 10.0, 2.0, 3.0, 6.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-32.9398193359375, -31.855924606323242, -30.772029876708984, -29.688135147094727, -28.60424041748047, -27.52034568786621, -26.436450958251953, -25.352556228637695, -24.268661499023438, -23.18476676940918, -22.100872039794922, -21.016977310180664, -19.933082580566406, -18.84918785095215, -17.76529312133789, -16.681398391723633, -15.597503662109375, -14.513608932495117, -13.42971420288086, -12.345819473266602, -11.261924743652344, -10.178030014038086, -9.094135284423828, -8.01024055480957, -6.9263458251953125, -5.842451095581055, -4.758556365966797, -3.674661636352539, -2.5907669067382812, -1.5068721771240234, -0.4229774475097656, 0.6609172821044922, 1.74481201171875, 2.828706741333008, 3.9126014709472656, 4.996496200561523, 6.080390930175781, 7.164285659790039, 8.248180389404297, 9.332075119018555, 10.415969848632812, 11.49986457824707, 12.583759307861328, 13.667654037475586, 14.751548767089844, 15.835443496704102, 16.91933822631836, 18.003232955932617, 19.087127685546875, 20.171022415161133, 21.25491714477539, 22.33881187438965, 23.422706604003906, 24.506601333618164, 25.590496063232422, 26.67439079284668, 27.758285522460938, 28.842180252075195, 29.926074981689453, 31.00996971130371, 32.09386444091797, 33.177757263183594, 34.261653900146484, 35.345550537109375, 36.429443359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 4.0, 5.0, 8.0, 13.0, 17.0, 9.0, 17.0, 17.0, 21.0, 21.0, 39.0, 26.0, 21.0, 35.0, 43.0, 41.0, 39.0, 42.0, 48.0, 36.0, 45.0, 34.0, 46.0, 51.0, 37.0, 36.0, 29.0, 25.0, 29.0, 22.0, 26.0, 26.0, 22.0, 13.0, 14.0, 5.0, 7.0, 6.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.1875, -5.01373291015625, -4.8399658203125, -4.66619873046875, -4.492431640625, -4.31866455078125, -4.1448974609375, -3.97113037109375, -3.79736328125, -3.62359619140625, -3.4498291015625, -3.27606201171875, -3.102294921875, -2.92852783203125, -2.7547607421875, -2.58099365234375, -2.4072265625, -2.23345947265625, -2.0596923828125, -1.88592529296875, -1.712158203125, -1.53839111328125, -1.3646240234375, -1.19085693359375, -1.01708984375, -0.84332275390625, -0.6695556640625, -0.49578857421875, -0.322021484375, -0.14825439453125, 0.0255126953125, 0.19927978515625, 0.373046875, 0.54681396484375, 0.7205810546875, 0.89434814453125, 1.068115234375, 1.24188232421875, 1.4156494140625, 1.58941650390625, 1.76318359375, 1.93695068359375, 2.1107177734375, 2.28448486328125, 2.458251953125, 2.63201904296875, 2.8057861328125, 2.97955322265625, 3.1533203125, 3.32708740234375, 3.5008544921875, 3.67462158203125, 3.848388671875, 4.02215576171875, 4.1959228515625, 4.36968994140625, 4.54345703125, 4.71722412109375, 4.8909912109375, 5.06475830078125, 5.238525390625, 5.41229248046875, 5.5860595703125, 5.75982666015625, 5.93359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 10.0, 22.0, 23.0, 32.0, 76.0, 118.0, 136.0, 212.0, 357.0, 509.0, 734.0, 1085.0, 1716.0, 2566.0, 3966.0, 6466.0, 10201.0, 16058.0, 26370.0, 43636.0, 71987.0, 118230.0, 178845.0, 196265.0, 141779.0, 88579.0, 52734.0, 32201.0, 19699.0, 12395.0, 7534.0, 4905.0, 3084.0, 2109.0, 1289.0, 864.0, 582.0, 379.0, 242.0, 168.0, 135.0, 82.0, 62.0, 40.0, 30.0, 11.0, 12.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.60791015625, -0.589599609375, -0.5712890625, -0.552978515625, -0.53466796875, -0.516357421875, -0.498046875, -0.479736328125, -0.46142578125, -0.443115234375, -0.4248046875, -0.406494140625, -0.38818359375, -0.369873046875, -0.3515625, -0.333251953125, -0.31494140625, -0.296630859375, -0.2783203125, -0.260009765625, -0.24169921875, -0.223388671875, -0.205078125, -0.186767578125, -0.16845703125, -0.150146484375, -0.1318359375, -0.113525390625, -0.09521484375, -0.076904296875, -0.05859375, -0.040283203125, -0.02197265625, -0.003662109375, 0.0146484375, 0.032958984375, 0.05126953125, 0.069580078125, 0.087890625, 0.106201171875, 0.12451171875, 0.142822265625, 0.1611328125, 0.179443359375, 0.19775390625, 0.216064453125, 0.234375, 0.252685546875, 0.27099609375, 0.289306640625, 0.3076171875, 0.325927734375, 0.34423828125, 0.362548828125, 0.380859375, 0.399169921875, 0.41748046875, 0.435791015625, 0.4541015625, 0.472412109375, 0.49072265625, 0.509033203125, 0.52734375, 0.545654296875, 0.56396484375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 7.0, 10.0, 13.0, 17.0, 16.0, 20.0, 24.0, 35.0, 37.0, 39.0, 41.0, 37.0, 60.0, 59.0, 42.0, 1083.0, 60.0, 54.0, 58.0, 44.0, 40.0, 36.0, 25.0, 33.0, 24.0, 21.0, 12.0, 22.0, 17.0, 10.0, 3.0, 11.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.966796875, -3.828643798828125, -3.69049072265625, -3.552337646484375, -3.4141845703125, -3.276031494140625, -3.13787841796875, -2.999725341796875, -2.861572265625, -2.723419189453125, -2.58526611328125, -2.447113037109375, -2.3089599609375, -2.170806884765625, -2.03265380859375, -1.894500732421875, -1.75634765625, -1.618194580078125, -1.48004150390625, -1.341888427734375, -1.2037353515625, -1.065582275390625, -0.92742919921875, -0.789276123046875, -0.651123046875, -0.512969970703125, -0.37481689453125, -0.236663818359375, -0.0985107421875, 0.039642333984375, 0.17779541015625, 0.315948486328125, 0.4541015625, 0.592254638671875, 0.73040771484375, 0.868560791015625, 1.0067138671875, 1.144866943359375, 1.28302001953125, 1.421173095703125, 1.559326171875, 1.697479248046875, 1.83563232421875, 1.973785400390625, 2.1119384765625, 2.250091552734375, 2.38824462890625, 2.526397705078125, 2.66455078125, 2.802703857421875, 2.94085693359375, 3.079010009765625, 3.2171630859375, 3.355316162109375, 3.49346923828125, 3.631622314453125, 3.769775390625, 3.907928466796875, 4.04608154296875, 4.184234619140625, 4.3223876953125, 4.460540771484375, 4.59869384765625, 4.736846923828125, 4.875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 15.0, 17.0, 28.0, 54.0, 63.0, 83.0, 153.0, 233.0, 349.0, 511.0, 787.0, 1240.0, 1900.0, 3017.0, 4819.0, 7949.0, 13199.0, 21750.0, 37568.0, 64881.0, 109205.0, 168257.0, 1248974.0, 161056.0, 102894.0, 60427.0, 34760.0, 20695.0, 12102.0, 7580.0, 4587.0, 2909.0, 1778.0, 1170.0, 725.0, 464.0, 292.0, 206.0, 145.0, 85.0, 56.0, 39.0, 37.0, 23.0, 17.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.449462890625, -0.4351654052734375, -0.420867919921875, -0.4065704345703125, -0.39227294921875, -0.3779754638671875, -0.363677978515625, -0.3493804931640625, -0.3350830078125, -0.3207855224609375, -0.306488037109375, -0.2921905517578125, -0.27789306640625, -0.2635955810546875, -0.249298095703125, -0.2350006103515625, -0.220703125, -0.2064056396484375, -0.192108154296875, -0.1778106689453125, -0.16351318359375, -0.1492156982421875, -0.134918212890625, -0.1206207275390625, -0.1063232421875, -0.0920257568359375, -0.077728271484375, -0.0634307861328125, -0.04913330078125, -0.0348358154296875, -0.020538330078125, -0.0062408447265625, 0.008056640625, 0.0223541259765625, 0.036651611328125, 0.0509490966796875, 0.06524658203125, 0.0795440673828125, 0.093841552734375, 0.1081390380859375, 0.1224365234375, 0.1367340087890625, 0.151031494140625, 0.1653289794921875, 0.17962646484375, 0.1939239501953125, 0.208221435546875, 0.2225189208984375, 0.23681640625, 0.2511138916015625, 0.265411376953125, 0.2797088623046875, 0.29400634765625, 0.3083038330078125, 0.322601318359375, 0.3368988037109375, 0.3511962890625, 0.3654937744140625, 0.379791259765625, 0.3940887451171875, 0.40838623046875, 0.4226837158203125, 0.436981201171875, 0.4512786865234375, 0.465576171875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 9.0, 9.0, 8.0, 7.0, 13.0, 18.0, 24.0, 21.0, 20.0, 36.0, 27.0, 34.0, 40.0, 60.0, 52.0, 39.0, 56.0, 48.0, 65.0, 44.0, 54.0, 43.0, 43.0, 34.0, 38.0, 27.0, 24.0, 22.0, 16.0, 16.0, 13.0, 8.0, 3.0, 7.0, 3.0, 6.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014190673828125, -0.0013776421546936035, -0.001336216926574707, -0.0012947916984558105, -0.001253366470336914, -0.0012119412422180176, -0.001170516014099121, -0.0011290907859802246, -0.0010876655578613281, -0.0010462403297424316, -0.0010048151016235352, -0.0009633898735046387, -0.0009219646453857422, -0.0008805394172668457, -0.0008391141891479492, -0.0007976889610290527, -0.0007562637329101562, -0.0007148385047912598, -0.0006734132766723633, -0.0006319880485534668, -0.0005905628204345703, -0.0005491375923156738, -0.0005077123641967773, -0.00046628713607788086, -0.0004248619079589844, -0.0003834366798400879, -0.0003420114517211914, -0.0003005862236022949, -0.00025916099548339844, -0.00021773576736450195, -0.00017631053924560547, -0.00013488531112670898, -9.34600830078125e-05, -5.2034854888916016e-05, -1.0609626770019531e-05, 3.081560134887695e-05, 7.224082946777344e-05, 0.00011366605758666992, 0.0001550912857055664, 0.0001965165138244629, 0.00023794174194335938, 0.00027936697006225586, 0.00032079219818115234, 0.00036221742630004883, 0.0004036426544189453, 0.0004450678825378418, 0.0004864931106567383, 0.0005279183387756348, 0.0005693435668945312, 0.0006107687950134277, 0.0006521940231323242, 0.0006936192512512207, 0.0007350444793701172, 0.0007764697074890137, 0.0008178949356079102, 0.0008593201637268066, 0.0009007453918457031, 0.0009421706199645996, 0.000983595848083496, 0.0010250210762023926, 0.001066446304321289, 0.0011078715324401855, 0.001149296760559082, 0.0011907219886779785, 0.001232147216796875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 0.0, 3.0, 8.0, 5.0, 8.0, 14.0, 16.0, 14.0, 25.0, 25.0, 34.0, 45.0, 44.0, 64.0, 102.0, 168.0, 298.0, 762.0, 8681.0, 1004566.0, 31722.0, 959.0, 361.0, 156.0, 116.0, 68.0, 56.0, 60.0, 34.0, 32.0, 23.0, 25.0, 15.0, 4.0, 11.0, 7.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0263214111328125, -0.025432348251342773, -0.024543285369873047, -0.02365422248840332, -0.022765159606933594, -0.021876096725463867, -0.02098703384399414, -0.020097970962524414, -0.019208908081054688, -0.01831984519958496, -0.017430782318115234, -0.016541719436645508, -0.01565265655517578, -0.014763593673706055, -0.013874530792236328, -0.012985467910766602, -0.012096405029296875, -0.011207342147827148, -0.010318279266357422, -0.009429216384887695, -0.008540153503417969, -0.007651090621948242, -0.006762027740478516, -0.005872964859008789, -0.0049839019775390625, -0.004094839096069336, -0.0032057762145996094, -0.002316713333129883, -0.0014276504516601562, -0.0005385875701904297, 0.0003504753112792969, 0.0012395381927490234, 0.00212860107421875, 0.0030176639556884766, 0.003906726837158203, 0.00479578971862793, 0.005684852600097656, 0.006573915481567383, 0.007462978363037109, 0.008352041244506836, 0.009241104125976562, 0.010130167007446289, 0.011019229888916016, 0.011908292770385742, 0.012797355651855469, 0.013686418533325195, 0.014575481414794922, 0.015464544296264648, 0.016353607177734375, 0.0172426700592041, 0.018131732940673828, 0.019020795822143555, 0.01990985870361328, 0.020798921585083008, 0.021687984466552734, 0.02257704734802246, 0.023466110229492188, 0.024355173110961914, 0.02524423599243164, 0.026133298873901367, 0.027022361755371094, 0.02791142463684082, 0.028800487518310547, 0.029689550399780273, 0.03057861328125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 43.0, 242.0, 519.0, 175.0, 29.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005974913015961647, -0.005827170796692371, -0.005679429043084383, -0.005531686823815107, -0.005383944604545832, -0.005236202850937843, -0.005088460631668568, -0.004940718412399292, -0.004792976193130016, -0.004645233973860741, -0.004497492220252752, -0.004349750000983477, -0.004202007781714201, -0.004054266028106213, -0.003906523808836937, -0.0037587815895676613, -0.003611039835959673, -0.003463297849521041, -0.0033155556302517653, -0.0031678136438131332, -0.0030200714245438576, -0.0028723294381052256, -0.0027245874516665936, -0.002576845232397318, -0.002429103245958686, -0.002281361259520054, -0.002133619040250778, -0.001985877053812146, -0.0018381349509581923, -0.0016903928481042385, -0.0015426508616656065, -0.0013949087588116527, -0.0012471671216189861, -0.0010994250187650323, -0.0009516829741187394, -0.0008039409294724464, -0.0006561988266184926, -0.0005084567237645388, -0.00036071467911824584, -0.00021297263447195292, -6.523053161799908e-05, 8.25115421321243e-05, 0.00023025361588224769, 0.00037799568963237107, 0.0005257377633824944, 0.0006734798662364483, 0.0008212219108827412, 0.0009689639555290341, 0.001116706058382988, 0.0012644481612369418, 0.0014121902640908957, 0.0015599322505295277, 0.0017076743533834815, 0.0018554164562374353, 0.0020031584426760674, 0.002150900661945343, 0.002298642648383975, 0.002446384634822607, 0.0025941268540918827, 0.0027418688405305147, 0.0028896108269691467, 0.0030373530462384224, 0.0031850950326770544, 0.0033328370191156864, 0.003480579238384962]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 5.0, 7.0, 11.0, 7.0, 14.0, 9.0, 17.0, 22.0, 11.0, 16.0, 17.0, 19.0, 29.0, 21.0, 30.0, 34.0, 28.0, 44.0, 30.0, 42.0, 45.0, 47.0, 31.0, 47.0, 36.0, 20.0, 36.0, 43.0, 39.0, 20.0, 27.0, 20.0, 17.0, 10.0, 21.0, 13.0, 18.0, 14.0, 13.0, 14.0, 11.0, 6.0, 10.0, 6.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0006487369537353516, -0.0006285011768341064, -0.0006082653999328613, -0.0005880296230316162, -0.0005677938461303711, -0.000547558069229126, -0.0005273222923278809, -0.0005070865154266357, -0.0004868507385253906, -0.0004666149616241455, -0.0004463791847229004, -0.0004261434078216553, -0.00040590763092041016, -0.00038567185401916504, -0.0003654360771179199, -0.0003452003002166748, -0.0003249645233154297, -0.00030472874641418457, -0.00028449296951293945, -0.00026425719261169434, -0.00024402141571044922, -0.0002237856388092041, -0.00020354986190795898, -0.00018331408500671387, -0.00016307830810546875, -0.00014284253120422363, -0.00012260675430297852, -0.0001023709774017334, -8.213520050048828e-05, -6.189942359924316e-05, -4.166364669799805e-05, -2.142786979675293e-05, -1.1920928955078125e-06, 1.9043684005737305e-05, 3.927946090698242e-05, 5.951523780822754e-05, 7.975101470947266e-05, 9.998679161071777e-05, 0.00012022256851196289, 0.000140458345413208, 0.00016069412231445312, 0.00018092989921569824, 0.00020116567611694336, 0.00022140145301818848, 0.0002416372299194336, 0.0002618730068206787, 0.00028210878372192383, 0.00030234456062316895, 0.00032258033752441406, 0.0003428161144256592, 0.0003630518913269043, 0.0003832876682281494, 0.00040352344512939453, 0.00042375922203063965, 0.00044399499893188477, 0.0004642307758331299, 0.000484466552734375, 0.0005047023296356201, 0.0005249381065368652, 0.0005451738834381104, 0.0005654096603393555, 0.0005856454372406006, 0.0006058812141418457, 0.0006261169910430908, 0.0006463527679443359]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 4.0, 5.0, 7.0, 14.0, 17.0, 9.0, 17.0, 17.0, 21.0, 21.0, 39.0, 26.0, 21.0, 35.0, 43.0, 41.0, 39.0, 42.0, 48.0, 36.0, 45.0, 34.0, 46.0, 51.0, 37.0, 36.0, 29.0, 25.0, 29.0, 22.0, 26.0, 26.0, 22.0, 13.0, 14.0, 5.0, 7.0, 6.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.1875, -5.01373291015625, -4.8399658203125, -4.66619873046875, -4.492431640625, -4.31866455078125, -4.1448974609375, -3.97113037109375, -3.79736328125, -3.62359619140625, -3.4498291015625, -3.27606201171875, -3.102294921875, -2.92852783203125, -2.7547607421875, -2.58099365234375, -2.4072265625, -2.23345947265625, -2.0596923828125, -1.88592529296875, -1.712158203125, -1.53839111328125, -1.3646240234375, -1.19085693359375, -1.01708984375, -0.84332275390625, -0.6695556640625, -0.49578857421875, -0.322021484375, -0.14825439453125, 0.0255126953125, 0.19927978515625, 0.373046875, 0.54681396484375, 0.7205810546875, 0.89434814453125, 1.068115234375, 1.24188232421875, 1.4156494140625, 1.58941650390625, 1.76318359375, 1.93695068359375, 2.1107177734375, 2.28448486328125, 2.458251953125, 2.63201904296875, 2.8057861328125, 2.97955322265625, 3.1533203125, 3.32708740234375, 3.5008544921875, 3.67462158203125, 3.848388671875, 4.02215576171875, 4.1959228515625, 4.36968994140625, 4.54345703125, 4.71722412109375, 4.8909912109375, 5.06475830078125, 5.238525390625, 5.41229248046875, 5.5860595703125, 5.75982666015625, 5.93359375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 13.0, 12.0, 22.0, 29.0, 47.0, 65.0, 104.0, 180.0, 242.0, 412.0, 669.0, 1108.0, 1879.0, 3377.0, 6690.0, 14267.0, 32613.0, 85138.0, 259348.0, 410895.0, 140871.0, 50002.0, 20394.0, 9419.0, 4557.0, 2483.0, 1441.0, 842.0, 478.0, 345.0, 213.0, 133.0, 94.0, 56.0, 38.0, 18.0, 18.0, 15.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.41796875, -5.2684326171875, -5.118896484375, -4.9693603515625, -4.81982421875, -4.6702880859375, -4.520751953125, -4.3712158203125, -4.2216796875, -4.0721435546875, -3.922607421875, -3.7730712890625, -3.62353515625, -3.4739990234375, -3.324462890625, -3.1749267578125, -3.025390625, -2.8758544921875, -2.726318359375, -2.5767822265625, -2.42724609375, -2.2777099609375, -2.128173828125, -1.9786376953125, -1.8291015625, -1.6795654296875, -1.530029296875, -1.3804931640625, -1.23095703125, -1.0814208984375, -0.931884765625, -0.7823486328125, -0.6328125, -0.4832763671875, -0.333740234375, -0.1842041015625, -0.03466796875, 0.1148681640625, 0.264404296875, 0.4139404296875, 0.5634765625, 0.7130126953125, 0.862548828125, 1.0120849609375, 1.16162109375, 1.3111572265625, 1.460693359375, 1.6102294921875, 1.759765625, 1.9093017578125, 2.058837890625, 2.2083740234375, 2.35791015625, 2.5074462890625, 2.656982421875, 2.8065185546875, 2.9560546875, 3.1055908203125, 3.255126953125, 3.4046630859375, 3.55419921875, 3.7037353515625, 3.853271484375, 4.0028076171875, 4.15234375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 4.0, 6.0, 4.0, 9.0, 9.0, 10.0, 15.0, 17.0, 22.0, 22.0, 27.0, 36.0, 29.0, 38.0, 40.0, 39.0, 35.0, 53.0, 119.0, 356.0, 1525.0, 141.0, 77.0, 62.0, 49.0, 38.0, 44.0, 33.0, 39.0, 27.0, 26.0, 17.0, 12.0, 16.0, 10.0, 7.0, 8.0, 2.0, 3.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-21.71875, -21.099853515625, -20.48095703125, -19.862060546875, -19.2431640625, -18.624267578125, -18.00537109375, -17.386474609375, -16.767578125, -16.148681640625, -15.52978515625, -14.910888671875, -14.2919921875, -13.673095703125, -13.05419921875, -12.435302734375, -11.81640625, -11.197509765625, -10.57861328125, -9.959716796875, -9.3408203125, -8.721923828125, -8.10302734375, -7.484130859375, -6.865234375, -6.246337890625, -5.62744140625, -5.008544921875, -4.3896484375, -3.770751953125, -3.15185546875, -2.532958984375, -1.9140625, -1.295166015625, -0.67626953125, -0.057373046875, 0.5615234375, 1.180419921875, 1.79931640625, 2.418212890625, 3.037109375, 3.656005859375, 4.27490234375, 4.893798828125, 5.5126953125, 6.131591796875, 6.75048828125, 7.369384765625, 7.98828125, 8.607177734375, 9.22607421875, 9.844970703125, 10.4638671875, 11.082763671875, 11.70166015625, 12.320556640625, 12.939453125, 13.558349609375, 14.17724609375, 14.796142578125, 15.4150390625, 16.033935546875, 16.65283203125, 17.271728515625, 17.890625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 11.0, 10.0, 12.0, 13.0, 23.0, 41.0, 59.0, 77.0, 138.0, 165.0, 252.0, 433.0, 905.0, 25391.0, 3110114.0, 6305.0, 608.0, 333.0, 253.0, 159.0, 130.0, 68.0, 53.0, 37.0, 33.0, 18.0, 16.0, 18.0, 10.0, 7.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-67.1875, -65.173828125, -63.16015625, -61.146484375, -59.1328125, -57.119140625, -55.10546875, -53.091796875, -51.078125, -49.064453125, -47.05078125, -45.037109375, -43.0234375, -41.009765625, -38.99609375, -36.982421875, -34.96875, -32.955078125, -30.94140625, -28.927734375, -26.9140625, -24.900390625, -22.88671875, -20.873046875, -18.859375, -16.845703125, -14.83203125, -12.818359375, -10.8046875, -8.791015625, -6.77734375, -4.763671875, -2.75, -0.736328125, 1.27734375, 3.291015625, 5.3046875, 7.318359375, 9.33203125, 11.345703125, 13.359375, 15.373046875, 17.38671875, 19.400390625, 21.4140625, 23.427734375, 25.44140625, 27.455078125, 29.46875, 31.482421875, 33.49609375, 35.509765625, 37.5234375, 39.537109375, 41.55078125, 43.564453125, 45.578125, 47.591796875, 49.60546875, 51.619140625, 53.6328125, 55.646484375, 57.66015625, 59.673828125, 61.6875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 19.0, 134.0, 450.0, 313.0, 88.0, 11.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-148.3781280517578, -145.7188720703125, -143.0596160888672, -140.40037536621094, -137.74111938476562, -135.0818634033203, -132.422607421875, -129.7633514404297, -127.1041030883789, -124.4448471069336, -121.78559875488281, -119.1263427734375, -116.46709442138672, -113.8078384399414, -111.14859008789062, -108.48933410644531, -105.830078125, -103.17082214355469, -100.5115737915039, -97.8523178100586, -95.19306945800781, -92.5338134765625, -89.87455749511719, -87.2153091430664, -84.55606079101562, -81.89680480957031, -79.23755645751953, -76.57830047607422, -73.91905212402344, -71.25979614257812, -68.60054016113281, -65.94129180908203, -63.28203582763672, -60.62278366088867, -57.963531494140625, -55.30427551269531, -52.645023345947266, -49.98577117919922, -47.32651901245117, -44.667266845703125, -42.00801086425781, -39.348758697509766, -36.68950653076172, -34.030250549316406, -31.37099838256836, -28.711746215820312, -26.052494049072266, -23.393239974975586, -20.733989715576172, -18.074737548828125, -15.415483474731445, -12.756231307983398, -10.096978187561035, -7.437725067138672, -4.778472900390625, -2.1192188262939453, 0.5400333404541016, 3.1992862224578857, 5.85853910446167, 8.517791748046875, 11.177044868469238, 13.836297988891602, 16.49555015563965, 19.154804229736328, 21.814056396484375]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 7.0, 8.0, 3.0, 5.0, 7.0, 8.0, 13.0, 13.0, 23.0, 17.0, 22.0, 25.0, 23.0, 21.0, 21.0, 27.0, 31.0, 23.0, 30.0, 32.0, 42.0, 42.0, 37.0, 46.0, 31.0, 38.0, 28.0, 44.0, 34.0, 35.0, 37.0, 30.0, 21.0, 27.0, 22.0, 23.0, 24.0, 20.0, 12.0, 12.0, 6.0, 5.0, 4.0, 6.0, 6.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.33206558227539, -47.75941467285156, -46.18675994873047, -44.61410903930664, -43.04145812988281, -41.46880340576172, -39.89615249633789, -38.32350158691406, -36.75084686279297, -35.17819595336914, -33.60554122924805, -32.03289031982422, -30.460237503051758, -28.887584686279297, -27.31493377685547, -25.742280960083008, -24.169628143310547, -22.596975326538086, -21.024322509765625, -19.451671600341797, -17.879018783569336, -16.306365966796875, -14.73371410369873, -13.161062240600586, -11.588409423828125, -10.015756607055664, -8.44310474395752, -6.870452404022217, -5.297800064086914, -3.7251477241516113, -2.1524953842163086, -0.5798435211181641, 0.9928092956542969, 2.5654616355895996, 4.138113975524902, 5.710766315460205, 7.283418655395508, 8.856071472167969, 10.428723335266113, 12.001375198364258, 13.574028015136719, 15.14668083190918, 16.71933364868164, 18.29198455810547, 19.86463737487793, 21.43729019165039, 23.00994110107422, 24.58259391784668, 26.15524673461914, 27.7278995513916, 29.300552368164062, 30.87320327758789, 32.44585418701172, 34.01850891113281, 35.59115982055664, 37.16381072998047, 38.73646545410156, 40.30911636352539, 41.881771087646484, 43.45442199707031, 45.027076721191406, 46.599727630615234, 48.17237854003906, 49.745033264160156, 51.317684173583984]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 11.0, 10.0, 6.0, 13.0, 19.0, 13.0, 16.0, 15.0, 23.0, 20.0, 33.0, 32.0, 35.0, 40.0, 31.0, 44.0, 44.0, 34.0, 42.0, 41.0, 50.0, 37.0, 41.0, 31.0, 38.0, 32.0, 28.0, 27.0, 34.0, 21.0, 21.0, 26.0, 21.0, 11.0, 10.0, 8.0, 10.0, 4.0, 5.0, 7.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.078125, -4.8988037109375, -4.719482421875, -4.5401611328125, -4.36083984375, -4.1815185546875, -4.002197265625, -3.8228759765625, -3.6435546875, -3.4642333984375, -3.284912109375, -3.1055908203125, -2.92626953125, -2.7469482421875, -2.567626953125, -2.3883056640625, -2.208984375, -2.0296630859375, -1.850341796875, -1.6710205078125, -1.49169921875, -1.3123779296875, -1.133056640625, -0.9537353515625, -0.7744140625, -0.5950927734375, -0.415771484375, -0.2364501953125, -0.05712890625, 0.1221923828125, 0.301513671875, 0.4808349609375, 0.66015625, 0.8394775390625, 1.018798828125, 1.1981201171875, 1.37744140625, 1.5567626953125, 1.736083984375, 1.9154052734375, 2.0947265625, 2.2740478515625, 2.453369140625, 2.6326904296875, 2.81201171875, 2.9913330078125, 3.170654296875, 3.3499755859375, 3.529296875, 3.7086181640625, 3.887939453125, 4.0672607421875, 4.24658203125, 4.4259033203125, 4.605224609375, 4.7845458984375, 4.9638671875, 5.1431884765625, 5.322509765625, 5.5018310546875, 5.68115234375, 5.8604736328125, 6.039794921875, 6.2191162109375, 6.3984375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 14.0, 9.0, 14.0, 11.0, 15.0, 22.0, 23.0, 35.0, 63.0, 82.0, 138.0, 264.0, 562.0, 1700.0, 8602.0, 87350.0, 1346825.0, 2476472.0, 249408.0, 18166.0, 2871.0, 769.0, 337.0, 176.0, 79.0, 60.0, 36.0, 34.0, 30.0, 27.0, 12.0, 14.0, 11.0, 6.0, 7.0, 5.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.8348388671875, -11.364990234375, -10.8951416015625, -10.42529296875, -9.9554443359375, -9.485595703125, -9.0157470703125, -8.5458984375, -8.0760498046875, -7.606201171875, -7.1363525390625, -6.66650390625, -6.1966552734375, -5.726806640625, -5.2569580078125, -4.787109375, -4.3172607421875, -3.847412109375, -3.3775634765625, -2.90771484375, -2.4378662109375, -1.968017578125, -1.4981689453125, -1.0283203125, -0.5584716796875, -0.088623046875, 0.3812255859375, 0.85107421875, 1.3209228515625, 1.790771484375, 2.2606201171875, 2.73046875, 3.2003173828125, 3.670166015625, 4.1400146484375, 4.60986328125, 5.0797119140625, 5.549560546875, 6.0194091796875, 6.4892578125, 6.9591064453125, 7.428955078125, 7.8988037109375, 8.36865234375, 8.8385009765625, 9.308349609375, 9.7781982421875, 10.248046875, 10.7178955078125, 11.187744140625, 11.6575927734375, 12.12744140625, 12.5972900390625, 13.067138671875, 13.5369873046875, 14.0068359375, 14.4766845703125, 14.946533203125, 15.4163818359375, 15.88623046875, 16.3560791015625, 16.825927734375, 17.2957763671875, 17.765625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 6.0, 12.0, 16.0, 22.0, 31.0, 39.0, 61.0, 99.0, 140.0, 204.0, 290.0, 401.0, 509.0, 565.0, 438.0, 375.0, 270.0, 169.0, 124.0, 79.0, 78.0, 38.0, 40.0, 18.0, 13.0, 11.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.421875, -14.971435546875, -14.52099609375, -14.070556640625, -13.6201171875, -13.169677734375, -12.71923828125, -12.268798828125, -11.818359375, -11.367919921875, -10.91748046875, -10.467041015625, -10.0166015625, -9.566162109375, -9.11572265625, -8.665283203125, -8.21484375, -7.764404296875, -7.31396484375, -6.863525390625, -6.4130859375, -5.962646484375, -5.51220703125, -5.061767578125, -4.611328125, -4.160888671875, -3.71044921875, -3.260009765625, -2.8095703125, -2.359130859375, -1.90869140625, -1.458251953125, -1.0078125, -0.557373046875, -0.10693359375, 0.343505859375, 0.7939453125, 1.244384765625, 1.69482421875, 2.145263671875, 2.595703125, 3.046142578125, 3.49658203125, 3.947021484375, 4.3974609375, 4.847900390625, 5.29833984375, 5.748779296875, 6.19921875, 6.649658203125, 7.10009765625, 7.550537109375, 8.0009765625, 8.451416015625, 8.90185546875, 9.352294921875, 9.802734375, 10.253173828125, 10.70361328125, 11.154052734375, 11.6044921875, 12.054931640625, 12.50537109375, 12.955810546875, 13.40625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 7.0, 4.0, 9.0, 7.0, 15.0, 24.0, 28.0, 34.0, 50.0, 78.0, 109.0, 150.0, 189.0, 228.0, 416.0, 908.0, 10629.0, 3589451.0, 587536.0, 2688.0, 614.0, 334.0, 232.0, 142.0, 104.0, 83.0, 58.0, 46.0, 36.0, 20.0, 18.0, 17.0, 13.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.9375, -46.2744140625, -44.611328125, -42.9482421875, -41.28515625, -39.6220703125, -37.958984375, -36.2958984375, -34.6328125, -32.9697265625, -31.306640625, -29.6435546875, -27.98046875, -26.3173828125, -24.654296875, -22.9912109375, -21.328125, -19.6650390625, -18.001953125, -16.3388671875, -14.67578125, -13.0126953125, -11.349609375, -9.6865234375, -8.0234375, -6.3603515625, -4.697265625, -3.0341796875, -1.37109375, 0.2919921875, 1.955078125, 3.6181640625, 5.28125, 6.9443359375, 8.607421875, 10.2705078125, 11.93359375, 13.5966796875, 15.259765625, 16.9228515625, 18.5859375, 20.2490234375, 21.912109375, 23.5751953125, 25.23828125, 26.9013671875, 28.564453125, 30.2275390625, 31.890625, 33.5537109375, 35.216796875, 36.8798828125, 38.54296875, 40.2060546875, 41.869140625, 43.5322265625, 45.1953125, 46.8583984375, 48.521484375, 50.1845703125, 51.84765625, 53.5107421875, 55.173828125, 56.8369140625, 58.5]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 9.0, 11.0, 33.0, 39.0, 64.0, 102.0, 135.0, 146.0, 162.0, 108.0, 81.0, 52.0, 29.0, 24.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.32976150512695, -58.35004806518555, -56.37033462524414, -54.39061737060547, -52.41090393066406, -50.431190490722656, -48.45147705078125, -46.471763610839844, -44.49205017089844, -42.51233673095703, -40.532623291015625, -38.55290985107422, -36.57319259643555, -34.59347915649414, -32.613765716552734, -30.634052276611328, -28.654335021972656, -26.67462158203125, -24.69490623474121, -22.715192794799805, -20.735477447509766, -18.75576400756836, -16.776050567626953, -14.79633617401123, -12.816621780395508, -10.836907386779785, -8.857192993164062, -6.877479553222656, -4.897765159606934, -2.918050765991211, -0.9383373260498047, 1.041377067565918, 3.021087646484375, 5.000802040100098, 6.980515956878662, 8.960229873657227, 10.93994426727295, 12.919658660888672, 14.899372100830078, 16.879085540771484, 18.858800888061523, 20.83851432800293, 22.81822967529297, 24.797943115234375, 26.77765655517578, 28.75737190246582, 30.737085342407227, 32.716800689697266, 34.69651412963867, 36.67622756958008, 38.655941009521484, 40.635658264160156, 42.61537170410156, 44.59508514404297, 46.574798583984375, 48.55451202392578, 50.53422546386719, 52.513938903808594, 54.49365234375, 56.473365783691406, 58.45308303833008, 60.432796478271484, 62.41250991821289, 64.39222717285156, 66.37194061279297]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 7.0, 11.0, 5.0, 2.0, 10.0, 15.0, 11.0, 12.0, 23.0, 11.0, 23.0, 20.0, 19.0, 27.0, 34.0, 25.0, 42.0, 30.0, 36.0, 44.0, 40.0, 38.0, 36.0, 38.0, 45.0, 36.0, 25.0, 31.0, 26.0, 31.0, 25.0, 25.0, 31.0, 21.0, 18.0, 25.0, 19.0, 17.0, 12.0, 8.0, 7.0, 6.0, 13.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.90130615234375, -34.78737258911133, -33.673439025878906, -32.559505462646484, -31.445571899414062, -30.33163833618164, -29.21770477294922, -28.103771209716797, -26.989837646484375, -25.875904083251953, -24.76197052001953, -23.64803695678711, -22.534103393554688, -21.420169830322266, -20.306236267089844, -19.192302703857422, -18.078369140625, -16.964435577392578, -15.850502014160156, -14.736568450927734, -13.622634887695312, -12.50870132446289, -11.394767761230469, -10.280834197998047, -9.166900634765625, -8.052967071533203, -6.939033508300781, -5.825099945068359, -4.7111663818359375, -3.5972328186035156, -2.4832992553710938, -1.3693656921386719, -0.25543212890625, 0.8585014343261719, 1.9724349975585938, 3.0863685607910156, 4.2003021240234375, 5.314235687255859, 6.428169250488281, 7.542102813720703, 8.656036376953125, 9.769969940185547, 10.883903503417969, 11.99783706665039, 13.111770629882812, 14.225704193115234, 15.339637756347656, 16.453571319580078, 17.5675048828125, 18.681438446044922, 19.795372009277344, 20.909305572509766, 22.023239135742188, 23.13717269897461, 24.25110626220703, 25.365039825439453, 26.478973388671875, 27.592906951904297, 28.70684051513672, 29.82077407836914, 30.934707641601562, 32.048641204833984, 33.162574768066406, 34.27650833129883, 35.39044189453125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 6.0, 9.0, 10.0, 10.0, 18.0, 15.0, 21.0, 21.0, 16.0, 30.0, 33.0, 39.0, 43.0, 36.0, 44.0, 55.0, 31.0, 48.0, 47.0, 43.0, 43.0, 44.0, 38.0, 37.0, 33.0, 29.0, 31.0, 30.0, 25.0, 15.0, 18.0, 11.0, 17.0, 15.0, 10.0, 3.0, 3.0, 4.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.37890625, -6.19329833984375, -6.0076904296875, -5.82208251953125, -5.636474609375, -5.45086669921875, -5.2652587890625, -5.07965087890625, -4.89404296875, -4.70843505859375, -4.5228271484375, -4.33721923828125, -4.151611328125, -3.96600341796875, -3.7803955078125, -3.59478759765625, -3.4091796875, -3.22357177734375, -3.0379638671875, -2.85235595703125, -2.666748046875, -2.48114013671875, -2.2955322265625, -2.10992431640625, -1.92431640625, -1.73870849609375, -1.5531005859375, -1.36749267578125, -1.181884765625, -0.99627685546875, -0.8106689453125, -0.62506103515625, -0.439453125, -0.25384521484375, -0.0682373046875, 0.11737060546875, 0.302978515625, 0.48858642578125, 0.6741943359375, 0.85980224609375, 1.04541015625, 1.23101806640625, 1.4166259765625, 1.60223388671875, 1.787841796875, 1.97344970703125, 2.1590576171875, 2.34466552734375, 2.5302734375, 2.71588134765625, 2.9014892578125, 3.08709716796875, 3.272705078125, 3.45831298828125, 3.6439208984375, 3.82952880859375, 4.01513671875, 4.20074462890625, 4.3863525390625, 4.57196044921875, 4.757568359375, 4.94317626953125, 5.1287841796875, 5.31439208984375, 5.5]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 5.0, 8.0, 7.0, 18.0, 14.0, 42.0, 66.0, 116.0, 168.0, 269.0, 430.0, 648.0, 971.0, 1514.0, 2467.0, 3804.0, 6185.0, 10030.0, 15820.0, 25661.0, 43923.0, 74875.0, 131944.0, 198994.0, 201282.0, 135523.0, 78297.0, 45254.0, 26740.0, 16071.0, 10125.0, 6244.0, 4081.0, 2633.0, 1603.0, 959.0, 641.0, 385.0, 260.0, 176.0, 96.0, 60.0, 47.0, 36.0, 27.0, 14.0, 7.0, 8.0, 9.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.64990234375, -0.6302261352539062, -0.6105499267578125, -0.5908737182617188, -0.571197509765625, -0.5515213012695312, -0.5318450927734375, -0.5121688842773438, -0.49249267578125, -0.47281646728515625, -0.4531402587890625, -0.43346405029296875, -0.413787841796875, -0.39411163330078125, -0.3744354248046875, -0.35475921630859375, -0.3350830078125, -0.31540679931640625, -0.2957305908203125, -0.27605438232421875, -0.256378173828125, -0.23670196533203125, -0.2170257568359375, -0.19734954833984375, -0.17767333984375, -0.15799713134765625, -0.1383209228515625, -0.11864471435546875, -0.098968505859375, -0.07929229736328125, -0.0596160888671875, -0.03993988037109375, -0.020263671875, -0.00058746337890625, 0.0190887451171875, 0.03876495361328125, 0.058441162109375, 0.07811737060546875, 0.0977935791015625, 0.11746978759765625, 0.13714599609375, 0.15682220458984375, 0.1764984130859375, 0.19617462158203125, 0.215850830078125, 0.23552703857421875, 0.2552032470703125, 0.27487945556640625, 0.2945556640625, 0.31423187255859375, 0.3339080810546875, 0.35358428955078125, 0.373260498046875, 0.39293670654296875, 0.4126129150390625, 0.43228912353515625, 0.45196533203125, 0.47164154052734375, 0.4913177490234375, 0.5109939575195312, 0.530670166015625, 0.5503463745117188, 0.5700225830078125, 0.5896987915039062, 0.609375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 9.0, 3.0, 6.0, 7.0, 11.0, 10.0, 16.0, 9.0, 17.0, 17.0, 19.0, 20.0, 25.0, 33.0, 25.0, 35.0, 36.0, 44.0, 40.0, 37.0, 46.0, 1071.0, 42.0, 35.0, 41.0, 37.0, 46.0, 52.0, 26.0, 34.0, 31.0, 17.0, 19.0, 28.0, 19.0, 16.0, 11.0, 11.0, 8.0, 6.0, 5.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.486328125, -3.373321533203125, -3.26031494140625, -3.147308349609375, -3.0343017578125, -2.921295166015625, -2.80828857421875, -2.695281982421875, -2.582275390625, -2.469268798828125, -2.35626220703125, -2.243255615234375, -2.1302490234375, -2.017242431640625, -1.90423583984375, -1.791229248046875, -1.67822265625, -1.565216064453125, -1.45220947265625, -1.339202880859375, -1.2261962890625, -1.113189697265625, -1.00018310546875, -0.887176513671875, -0.774169921875, -0.661163330078125, -0.54815673828125, -0.435150146484375, -0.3221435546875, -0.209136962890625, -0.09613037109375, 0.016876220703125, 0.1298828125, 0.242889404296875, 0.35589599609375, 0.468902587890625, 0.5819091796875, 0.694915771484375, 0.80792236328125, 0.920928955078125, 1.033935546875, 1.146942138671875, 1.25994873046875, 1.372955322265625, 1.4859619140625, 1.598968505859375, 1.71197509765625, 1.824981689453125, 1.93798828125, 2.050994873046875, 2.16400146484375, 2.277008056640625, 2.3900146484375, 2.503021240234375, 2.61602783203125, 2.729034423828125, 2.842041015625, 2.955047607421875, 3.06805419921875, 3.181060791015625, 3.2940673828125, 3.407073974609375, 3.52008056640625, 3.633087158203125, 3.74609375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 16.0, 9.0, 16.0, 31.0, 52.0, 60.0, 100.0, 180.0, 237.0, 379.0, 581.0, 926.0, 1429.0, 2287.0, 3602.0, 5656.0, 8895.0, 14733.0, 23058.0, 37627.0, 61702.0, 99101.0, 146528.0, 1223456.0, 159896.0, 115149.0, 72915.0, 44636.0, 27867.0, 16938.0, 10620.0, 6588.0, 4341.0, 2742.0, 1651.0, 1107.0, 699.0, 438.0, 287.0, 214.0, 126.0, 89.0, 57.0, 34.0, 22.0, 17.0, 15.0, 3.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.414306640625, -0.4012260437011719, -0.38814544677734375, -0.3750648498535156, -0.3619842529296875, -0.3489036560058594, -0.33582305908203125, -0.3227424621582031, -0.309661865234375, -0.2965812683105469, -0.28350067138671875, -0.2704200744628906, -0.2573394775390625, -0.24425888061523438, -0.23117828369140625, -0.21809768676757812, -0.20501708984375, -0.19193649291992188, -0.17885589599609375, -0.16577529907226562, -0.1526947021484375, -0.13961410522460938, -0.12653350830078125, -0.11345291137695312, -0.100372314453125, -0.08729171752929688, -0.07421112060546875, -0.061130523681640625, -0.0480499267578125, -0.034969329833984375, -0.02188873291015625, -0.008808135986328125, 0.0042724609375, 0.017353057861328125, 0.03043365478515625, 0.043514251708984375, 0.0565948486328125, 0.06967544555664062, 0.08275604248046875, 0.09583663940429688, 0.108917236328125, 0.12199783325195312, 0.13507843017578125, 0.14815902709960938, 0.1612396240234375, 0.17432022094726562, 0.18740081787109375, 0.20048141479492188, 0.21356201171875, 0.22664260864257812, 0.23972320556640625, 0.2528038024902344, 0.2658843994140625, 0.2789649963378906, 0.29204559326171875, 0.3051261901855469, 0.318206787109375, 0.3312873840332031, 0.34436798095703125, 0.3574485778808594, 0.3705291748046875, 0.3836097717285156, 0.39669036865234375, 0.4097709655761719, 0.4228515625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 6.0, 6.0, 2.0, 2.0, 5.0, 8.0, 11.0, 13.0, 18.0, 10.0, 20.0, 17.0, 22.0, 26.0, 49.0, 51.0, 39.0, 43.0, 48.0, 53.0, 54.0, 53.0, 53.0, 60.0, 47.0, 30.0, 54.0, 37.0, 37.0, 34.0, 20.0, 16.0, 6.0, 8.0, 11.0, 8.0, 5.0, 8.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014600753784179688, -0.0014127492904663086, -0.0013654232025146484, -0.0013180971145629883, -0.0012707710266113281, -0.001223444938659668, -0.0011761188507080078, -0.0011287927627563477, -0.0010814666748046875, -0.0010341405868530273, -0.0009868144989013672, -0.000939488410949707, -0.0008921623229980469, -0.0008448362350463867, -0.0007975101470947266, -0.0007501840591430664, -0.0007028579711914062, -0.0006555318832397461, -0.0006082057952880859, -0.0005608797073364258, -0.0005135536193847656, -0.00046622753143310547, -0.0004189014434814453, -0.00037157535552978516, -0.000324249267578125, -0.00027692317962646484, -0.0002295970916748047, -0.00018227100372314453, -0.00013494491577148438, -8.761882781982422e-05, -4.029273986816406e-05, 7.033348083496094e-06, 5.435943603515625e-05, 0.0001016855239868164, 0.00014901161193847656, 0.00019633769989013672, 0.00024366378784179688, 0.00029098987579345703, 0.0003383159637451172, 0.00038564205169677734, 0.0004329681396484375, 0.00048029422760009766, 0.0005276203155517578, 0.000574946403503418, 0.0006222724914550781, 0.0006695985794067383, 0.0007169246673583984, 0.0007642507553100586, 0.0008115768432617188, 0.0008589029312133789, 0.0009062290191650391, 0.0009535551071166992, 0.0010008811950683594, 0.0010482072830200195, 0.0010955333709716797, 0.0011428594589233398, 0.001190185546875, 0.0012375116348266602, 0.0012848377227783203, 0.0013321638107299805, 0.0013794898986816406, 0.0014268159866333008, 0.001474142074584961, 0.001521468162536621, 0.0015687942504882812]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 8.0, 2.0, 9.0, 11.0, 6.0, 9.0, 13.0, 19.0, 8.0, 42.0, 44.0, 42.0, 45.0, 82.0, 93.0, 143.0, 190.0, 377.0, 1198.0, 39938.0, 990443.0, 13855.0, 887.0, 347.0, 186.0, 115.0, 84.0, 62.0, 42.0, 55.0, 26.0, 24.0, 18.0, 16.0, 15.0, 24.0, 18.0, 8.0, 9.0, 9.0, 3.0, 6.0, 2.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.0280609130859375, -0.027194976806640625, -0.02632904052734375, -0.025463104248046875, -0.02459716796875, -0.023731231689453125, -0.02286529541015625, -0.021999359130859375, -0.0211334228515625, -0.020267486572265625, -0.01940155029296875, -0.018535614013671875, -0.017669677734375, -0.016803741455078125, -0.01593780517578125, -0.015071868896484375, -0.0142059326171875, -0.013339996337890625, -0.01247406005859375, -0.011608123779296875, -0.0107421875, -0.009876251220703125, -0.00901031494140625, -0.008144378662109375, -0.0072784423828125, -0.006412506103515625, -0.00554656982421875, -0.004680633544921875, -0.003814697265625, -0.002948760986328125, -0.00208282470703125, -0.001216888427734375, -0.0003509521484375, 0.000514984130859375, 0.00138092041015625, 0.002246856689453125, 0.00311279296875, 0.003978729248046875, 0.00484466552734375, 0.005710601806640625, 0.0065765380859375, 0.007442474365234375, 0.00830841064453125, 0.009174346923828125, 0.010040283203125, 0.010906219482421875, 0.01177215576171875, 0.012638092041015625, 0.0135040283203125, 0.014369964599609375, 0.01523590087890625, 0.016101837158203125, 0.0169677734375, 0.017833709716796875, 0.01869964599609375, 0.019565582275390625, 0.0204315185546875, 0.021297454833984375, 0.02216339111328125, 0.023029327392578125, 0.023895263671875, 0.024761199951171875, 0.02562713623046875, 0.026493072509765625, 0.0273590087890625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 189.0, 690.0, 123.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016015776200219989, -0.0013522914377972484, -0.0011030053719878197, -0.0008537191897630692, -0.0006044330075383186, -0.0003551468253135681, -0.00010586075950413942, 0.0001434254227206111, 0.0003927116049453616, 0.0006419977871701121, 0.0008912839111872017, 0.0011405700352042913, 0.0013898562174290419, 0.0016391423996537924, 0.001888428465463221, 0.0021377145312726498, 0.0023870007134974003, 0.002636286895722151, 0.0028855730779469013, 0.003134859260171652, 0.0033841454423964024, 0.003633431624621153, 0.0038827175740152597, 0.004132003523409367, 0.0043812901712954044, 0.004630576353520155, 0.0048798625357449055, 0.005129148717969656, 0.0053784349001944065, 0.005627721082419157, 0.00587700679898262, 0.006126292981207371, 0.006375580094754696, 0.006624866276979446, 0.006874152459204197, 0.0071234386414289474, 0.007372724823653698, 0.0076220110058784485, 0.007871297188103199, 0.00812058337032795, 0.0083698695525527, 0.00861915573477745, 0.008868441917002201, 0.009117728099226952, 0.009367014281451702, 0.009616300463676453, 0.009865586645901203, 0.010114872828125954, 0.01036415807902813, 0.01061344426125288, 0.01086273044347763, 0.011112016625702381, 0.011361302807927132, 0.011610588990151882, 0.011859875172376633, 0.012109161354601383, 0.012358447536826134, 0.012607733719050884, 0.012857019901275635, 0.013106306083500385, 0.013355592265725136, 0.013604878447949886, 0.013854164630174637, 0.014103450812399387, 0.014352736994624138]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 7.0, 1.0, 8.0, 5.0, 10.0, 18.0, 15.0, 18.0, 19.0, 16.0, 28.0, 28.0, 22.0, 31.0, 28.0, 32.0, 43.0, 30.0, 44.0, 47.0, 46.0, 32.0, 35.0, 37.0, 26.0, 40.0, 48.0, 31.0, 32.0, 29.0, 27.0, 23.0, 16.0, 21.0, 13.0, 22.0, 15.0, 14.0, 7.0, 9.0, 6.0, 12.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0008257627487182617, -0.0008004559203982353, -0.0007751490920782089, -0.0007498422637581825, -0.0007245354354381561, -0.0006992286071181297, -0.0006739217787981033, -0.0006486149504780769, -0.0006233081221580505, -0.0005980012938380241, -0.0005726944655179977, -0.0005473876371979713, -0.000522080808877945, -0.0004967739805579185, -0.00047146715223789215, -0.00044616032391786575, -0.00042085349559783936, -0.00039554666727781296, -0.00037023983895778656, -0.00034493301063776016, -0.00031962618231773376, -0.00029431935399770737, -0.00026901252567768097, -0.00024370569735765457, -0.00021839886903762817, -0.00019309204071760178, -0.00016778521239757538, -0.00014247838407754898, -0.00011717155575752258, -9.186472743749619e-05, -6.655789911746979e-05, -4.125107079744339e-05, -1.5944242477416992e-05, 9.362585842609406e-06, 3.46694141626358e-05, 5.99762424826622e-05, 8.52830708026886e-05, 0.000110589899122715, 0.0001358967274427414, 0.0001612035557627678, 0.0001865103840827942, 0.0002118172124028206, 0.00023712404072284698, 0.0002624308690428734, 0.0002877376973628998, 0.0003130445256829262, 0.0003383513540029526, 0.000363658182322979, 0.00038896501064300537, 0.00041427183896303177, 0.00043957866728305817, 0.00046488549560308456, 0.000490192323923111, 0.0005154991522431374, 0.0005408059805631638, 0.0005661128088831902, 0.0005914196372032166, 0.000616726465523243, 0.0006420332938432693, 0.0006673401221632957, 0.0006926469504833221, 0.0007179537788033485, 0.0007432606071233749, 0.0007685674354434013, 0.0007938742637634277]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 6.0, 9.0, 10.0, 10.0, 18.0, 15.0, 21.0, 21.0, 16.0, 30.0, 33.0, 39.0, 42.0, 37.0, 44.0, 55.0, 31.0, 48.0, 46.0, 44.0, 43.0, 44.0, 38.0, 37.0, 33.0, 29.0, 31.0, 30.0, 25.0, 15.0, 18.0, 11.0, 17.0, 15.0, 10.0, 3.0, 3.0, 4.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.37890625, -6.19329833984375, -6.0076904296875, -5.82208251953125, -5.636474609375, -5.45086669921875, -5.2652587890625, -5.07965087890625, -4.89404296875, -4.70843505859375, -4.5228271484375, -4.33721923828125, -4.151611328125, -3.96600341796875, -3.7803955078125, -3.59478759765625, -3.4091796875, -3.22357177734375, -3.0379638671875, -2.85235595703125, -2.666748046875, -2.48114013671875, -2.2955322265625, -2.10992431640625, -1.92431640625, -1.73870849609375, -1.5531005859375, -1.36749267578125, -1.181884765625, -0.99627685546875, -0.8106689453125, -0.62506103515625, -0.439453125, -0.25384521484375, -0.0682373046875, 0.11737060546875, 0.302978515625, 0.48858642578125, 0.6741943359375, 0.85980224609375, 1.04541015625, 1.23101806640625, 1.4166259765625, 1.60223388671875, 1.787841796875, 1.97344970703125, 2.1590576171875, 2.34466552734375, 2.5302734375, 2.71588134765625, 2.9014892578125, 3.08709716796875, 3.272705078125, 3.45831298828125, 3.6439208984375, 3.82952880859375, 4.01513671875, 4.20074462890625, 4.3863525390625, 4.57196044921875, 4.757568359375, 4.94317626953125, 5.1287841796875, 5.31439208984375, 5.5]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 7.0, 5.0, 11.0, 15.0, 16.0, 21.0, 24.0, 42.0, 50.0, 85.0, 130.0, 215.0, 360.0, 648.0, 1269.0, 2455.0, 5580.0, 14137.0, 46979.0, 190790.0, 537777.0, 179607.0, 44225.0, 13539.0, 5296.0, 2459.0, 1218.0, 638.0, 342.0, 211.0, 138.0, 57.0, 57.0, 32.0, 32.0, 21.0, 24.0, 11.0, 5.0, 7.0, 7.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.22265625, -6.04217529296875, -5.8616943359375, -5.68121337890625, -5.500732421875, -5.32025146484375, -5.1397705078125, -4.95928955078125, -4.77880859375, -4.59832763671875, -4.4178466796875, -4.23736572265625, -4.056884765625, -3.87640380859375, -3.6959228515625, -3.51544189453125, -3.3349609375, -3.15447998046875, -2.9739990234375, -2.79351806640625, -2.613037109375, -2.43255615234375, -2.2520751953125, -2.07159423828125, -1.89111328125, -1.71063232421875, -1.5301513671875, -1.34967041015625, -1.169189453125, -0.98870849609375, -0.8082275390625, -0.62774658203125, -0.447265625, -0.26678466796875, -0.0863037109375, 0.09417724609375, 0.274658203125, 0.45513916015625, 0.6356201171875, 0.81610107421875, 0.99658203125, 1.17706298828125, 1.3575439453125, 1.53802490234375, 1.718505859375, 1.89898681640625, 2.0794677734375, 2.25994873046875, 2.4404296875, 2.62091064453125, 2.8013916015625, 2.98187255859375, 3.162353515625, 3.34283447265625, 3.5233154296875, 3.70379638671875, 3.88427734375, 4.06475830078125, 4.2452392578125, 4.42572021484375, 4.606201171875, 4.78668212890625, 4.9671630859375, 5.14764404296875, 5.328125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 8.0, 8.0, 4.0, 13.0, 17.0, 12.0, 20.0, 18.0, 19.0, 20.0, 33.0, 40.0, 43.0, 32.0, 45.0, 54.0, 93.0, 325.0, 1627.0, 153.0, 58.0, 47.0, 46.0, 47.0, 40.0, 35.0, 25.0, 24.0, 25.0, 23.0, 16.0, 16.0, 13.0, 11.0, 14.0, 12.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.0625, -19.419921875, -18.77734375, -18.134765625, -17.4921875, -16.849609375, -16.20703125, -15.564453125, -14.921875, -14.279296875, -13.63671875, -12.994140625, -12.3515625, -11.708984375, -11.06640625, -10.423828125, -9.78125, -9.138671875, -8.49609375, -7.853515625, -7.2109375, -6.568359375, -5.92578125, -5.283203125, -4.640625, -3.998046875, -3.35546875, -2.712890625, -2.0703125, -1.427734375, -0.78515625, -0.142578125, 0.5, 1.142578125, 1.78515625, 2.427734375, 3.0703125, 3.712890625, 4.35546875, 4.998046875, 5.640625, 6.283203125, 6.92578125, 7.568359375, 8.2109375, 8.853515625, 9.49609375, 10.138671875, 10.78125, 11.423828125, 12.06640625, 12.708984375, 13.3515625, 13.994140625, 14.63671875, 15.279296875, 15.921875, 16.564453125, 17.20703125, 17.849609375, 18.4921875, 19.134765625, 19.77734375, 20.419921875, 21.0625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 24.0, 14.0, 18.0, 31.0, 27.0, 55.0, 61.0, 103.0, 143.0, 214.0, 315.0, 508.0, 1852.0, 126176.0, 3010266.0, 4156.0, 673.0, 317.0, 228.0, 150.0, 99.0, 69.0, 36.0, 40.0, 22.0, 30.0, 16.0, 11.0, 11.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.0, -53.28955078125, -51.5791015625, -49.86865234375, -48.158203125, -46.44775390625, -44.7373046875, -43.02685546875, -41.31640625, -39.60595703125, -37.8955078125, -36.18505859375, -34.474609375, -32.76416015625, -31.0537109375, -29.34326171875, -27.6328125, -25.92236328125, -24.2119140625, -22.50146484375, -20.791015625, -19.08056640625, -17.3701171875, -15.65966796875, -13.94921875, -12.23876953125, -10.5283203125, -8.81787109375, -7.107421875, -5.39697265625, -3.6865234375, -1.97607421875, -0.265625, 1.44482421875, 3.1552734375, 4.86572265625, 6.576171875, 8.28662109375, 9.9970703125, 11.70751953125, 13.41796875, 15.12841796875, 16.8388671875, 18.54931640625, 20.259765625, 21.97021484375, 23.6806640625, 25.39111328125, 27.1015625, 28.81201171875, 30.5224609375, 32.23291015625, 33.943359375, 35.65380859375, 37.3642578125, 39.07470703125, 40.78515625, 42.49560546875, 44.2060546875, 45.91650390625, 47.626953125, 49.33740234375, 51.0478515625, 52.75830078125, 54.46875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 103.0, 756.0, 157.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.90377807617188, -204.0189971923828, -200.1342010498047, -196.24942016601562, -192.36463928222656, -188.4798583984375, -184.59506225585938, -180.7102813720703, -176.82550048828125, -172.9407196044922, -169.05592346191406, -165.171142578125, -161.28636169433594, -157.40158081054688, -153.51678466796875, -149.6320037841797, -145.74722290039062, -141.86244201660156, -137.97764587402344, -134.09286499023438, -130.2080841064453, -126.32329559326172, -122.43850708007812, -118.55372619628906, -114.66893005371094, -110.78414154052734, -106.89936065673828, -103.01457214355469, -99.12979125976562, -95.24500274658203, -91.36021423339844, -87.47543334960938, -83.59065246582031, -79.70586395263672, -75.82108306884766, -71.93629455566406, -68.051513671875, -64.1667251586914, -60.28194046020508, -56.39715576171875, -52.51237106323242, -48.627586364746094, -44.742801666259766, -40.85801696777344, -36.973228454589844, -33.08844757080078, -29.203659057617188, -25.31887435913086, -21.43408966064453, -17.549304962158203, -13.664519309997559, -9.779733657836914, -5.894948959350586, -2.010164260864258, 1.8746223449707031, 5.759407043457031, 9.64419174194336, 13.528976440429688, 17.413761138916016, 21.298547744750977, 25.183332443237305, 29.068117141723633, 32.952903747558594, 36.83768844604492, 40.72247314453125]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 12.0, 8.0, 14.0, 15.0, 23.0, 15.0, 22.0, 31.0, 37.0, 28.0, 22.0, 44.0, 32.0, 32.0, 48.0, 47.0, 53.0, 38.0, 43.0, 49.0, 45.0, 44.0, 44.0, 43.0, 32.0, 36.0, 18.0, 20.0, 13.0, 15.0, 14.0, 14.0, 4.0, 11.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-57.84894943237305, -56.14171600341797, -54.43448257446289, -52.72724914550781, -51.02001953125, -49.31278610229492, -47.605552673339844, -45.898319244384766, -44.19108581542969, -42.48385238647461, -40.77661895751953, -39.06938934326172, -37.36215591430664, -35.65492248535156, -33.947689056396484, -32.240455627441406, -30.533226013183594, -28.825992584228516, -27.11876106262207, -25.411527633666992, -23.704296112060547, -21.99706268310547, -20.28982925415039, -18.582595825195312, -16.875364303588867, -15.168131828308105, -13.460899353027344, -11.753665924072266, -10.046433448791504, -8.339200973510742, -6.631967544555664, -4.924735069274902, -3.2175064086914062, -1.5102736949920654, 0.1969590187072754, 1.9041919708251953, 3.611424446105957, 5.318656921386719, 7.025890350341797, 8.733122825622559, 10.44035530090332, 12.147587776184082, 13.854820251464844, 15.562053680419922, 17.269287109375, 18.976518630981445, 20.683752059936523, 22.39098358154297, 24.098217010498047, 25.805450439453125, 27.51268196105957, 29.21991539001465, 30.927146911621094, 32.63438034057617, 34.34161376953125, 36.04884719848633, 37.756080627441406, 39.463314056396484, 41.17054748535156, 42.877777099609375, 44.58501052856445, 46.29224395751953, 47.99947738647461, 49.70671081542969, 51.4139404296875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 5.0, 10.0, 18.0, 15.0, 13.0, 11.0, 19.0, 27.0, 23.0, 31.0, 52.0, 36.0, 42.0, 35.0, 48.0, 42.0, 48.0, 54.0, 43.0, 34.0, 41.0, 46.0, 41.0, 30.0, 34.0, 19.0, 26.0, 18.0, 24.0, 20.0, 15.0, 17.0, 12.0, 5.0, 11.0, 7.0, 7.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.2109375, -6.019775390625, -5.82861328125, -5.637451171875, -5.4462890625, -5.255126953125, -5.06396484375, -4.872802734375, -4.681640625, -4.490478515625, -4.29931640625, -4.108154296875, -3.9169921875, -3.725830078125, -3.53466796875, -3.343505859375, -3.15234375, -2.961181640625, -2.77001953125, -2.578857421875, -2.3876953125, -2.196533203125, -2.00537109375, -1.814208984375, -1.623046875, -1.431884765625, -1.24072265625, -1.049560546875, -0.8583984375, -0.667236328125, -0.47607421875, -0.284912109375, -0.09375, 0.097412109375, 0.28857421875, 0.479736328125, 0.6708984375, 0.862060546875, 1.05322265625, 1.244384765625, 1.435546875, 1.626708984375, 1.81787109375, 2.009033203125, 2.2001953125, 2.391357421875, 2.58251953125, 2.773681640625, 2.96484375, 3.156005859375, 3.34716796875, 3.538330078125, 3.7294921875, 3.920654296875, 4.11181640625, 4.302978515625, 4.494140625, 4.685302734375, 4.87646484375, 5.067626953125, 5.2587890625, 5.449951171875, 5.64111328125, 5.832275390625, 6.0234375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 11.0, 4.0, 14.0, 16.0, 21.0, 25.0, 21.0, 35.0, 50.0, 62.0, 71.0, 87.0, 138.0, 244.0, 472.0, 1233.0, 5151.0, 44448.0, 736769.0, 2841649.0, 525699.0, 31761.0, 4076.0, 1028.0, 419.0, 203.0, 126.0, 90.0, 68.0, 54.0, 49.0, 44.0, 22.0, 30.0, 16.0, 15.0, 17.0, 11.0, 9.0, 7.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.7890625, -15.31689453125, -14.8447265625, -14.37255859375, -13.900390625, -13.42822265625, -12.9560546875, -12.48388671875, -12.01171875, -11.53955078125, -11.0673828125, -10.59521484375, -10.123046875, -9.65087890625, -9.1787109375, -8.70654296875, -8.234375, -7.76220703125, -7.2900390625, -6.81787109375, -6.345703125, -5.87353515625, -5.4013671875, -4.92919921875, -4.45703125, -3.98486328125, -3.5126953125, -3.04052734375, -2.568359375, -2.09619140625, -1.6240234375, -1.15185546875, -0.6796875, -0.20751953125, 0.2646484375, 0.73681640625, 1.208984375, 1.68115234375, 2.1533203125, 2.62548828125, 3.09765625, 3.56982421875, 4.0419921875, 4.51416015625, 4.986328125, 5.45849609375, 5.9306640625, 6.40283203125, 6.875, 7.34716796875, 7.8193359375, 8.29150390625, 8.763671875, 9.23583984375, 9.7080078125, 10.18017578125, 10.65234375, 11.12451171875, 11.5966796875, 12.06884765625, 12.541015625, 13.01318359375, 13.4853515625, 13.95751953125, 14.4296875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 4.0, 12.0, 17.0, 27.0, 42.0, 41.0, 57.0, 75.0, 127.0, 171.0, 206.0, 315.0, 405.0, 508.0, 478.0, 435.0, 330.0, 219.0, 178.0, 126.0, 96.0, 54.0, 48.0, 33.0, 17.0, 14.0, 13.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0703125, -12.67529296875, -12.2802734375, -11.88525390625, -11.490234375, -11.09521484375, -10.7001953125, -10.30517578125, -9.91015625, -9.51513671875, -9.1201171875, -8.72509765625, -8.330078125, -7.93505859375, -7.5400390625, -7.14501953125, -6.75, -6.35498046875, -5.9599609375, -5.56494140625, -5.169921875, -4.77490234375, -4.3798828125, -3.98486328125, -3.58984375, -3.19482421875, -2.7998046875, -2.40478515625, -2.009765625, -1.61474609375, -1.2197265625, -0.82470703125, -0.4296875, -0.03466796875, 0.3603515625, 0.75537109375, 1.150390625, 1.54541015625, 1.9404296875, 2.33544921875, 2.73046875, 3.12548828125, 3.5205078125, 3.91552734375, 4.310546875, 4.70556640625, 5.1005859375, 5.49560546875, 5.890625, 6.28564453125, 6.6806640625, 7.07568359375, 7.470703125, 7.86572265625, 8.2607421875, 8.65576171875, 9.05078125, 9.44580078125, 9.8408203125, 10.23583984375, 10.630859375, 11.02587890625, 11.4208984375, 11.81591796875, 12.2109375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 3.0, 5.0, 11.0, 24.0, 40.0, 61.0, 90.0, 118.0, 185.0, 248.0, 335.0, 592.0, 6994.0, 4024997.0, 158139.0, 1025.0, 447.0, 302.0, 206.0, 142.0, 92.0, 77.0, 42.0, 40.0, 22.0, 13.0, 11.0, 5.0, 8.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.4375, -67.3154296875, -65.193359375, -63.0712890625, -60.94921875, -58.8271484375, -56.705078125, -54.5830078125, -52.4609375, -50.3388671875, -48.216796875, -46.0947265625, -43.97265625, -41.8505859375, -39.728515625, -37.6064453125, -35.484375, -33.3623046875, -31.240234375, -29.1181640625, -26.99609375, -24.8740234375, -22.751953125, -20.6298828125, -18.5078125, -16.3857421875, -14.263671875, -12.1416015625, -10.01953125, -7.8974609375, -5.775390625, -3.6533203125, -1.53125, 0.5908203125, 2.712890625, 4.8349609375, 6.95703125, 9.0791015625, 11.201171875, 13.3232421875, 15.4453125, 17.5673828125, 19.689453125, 21.8115234375, 23.93359375, 26.0556640625, 28.177734375, 30.2998046875, 32.421875, 34.5439453125, 36.666015625, 38.7880859375, 40.91015625, 43.0322265625, 45.154296875, 47.2763671875, 49.3984375, 51.5205078125, 53.642578125, 55.7646484375, 57.88671875, 60.0087890625, 62.130859375, 64.2529296875, 66.375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 22.0, 113.0, 277.0, 376.0, 174.0, 42.0, 9.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-240.79660034179688, -235.9137725830078, -231.03094482421875, -226.1481170654297, -221.26528930664062, -216.38246154785156, -211.4996337890625, -206.6168212890625, -201.73397827148438, -196.8511505126953, -191.96832275390625, -187.0854949951172, -182.20266723632812, -177.31983947753906, -172.43701171875, -167.55419921875, -162.67137145996094, -157.78854370117188, -152.9057159423828, -148.02288818359375, -143.1400604248047, -138.25723266601562, -133.37440490722656, -128.4915771484375, -123.60875701904297, -118.7259292602539, -113.84310150146484, -108.96027374267578, -104.07745361328125, -99.19462585449219, -94.31179809570312, -89.42897033691406, -84.54615020751953, -79.66332244873047, -74.7804946899414, -69.89766693115234, -65.01484680175781, -60.132015228271484, -55.24919128417969, -50.366363525390625, -45.48353576660156, -40.6007080078125, -35.71788024902344, -30.83505630493164, -25.952228546142578, -21.069400787353516, -16.186574935913086, -11.303749084472656, -6.420921325683594, -1.5380945205688477, 3.3447322845458984, 8.227559089660645, 13.11038589477539, 17.993213653564453, 22.876039505004883, 27.758865356445312, 32.641693115234375, 37.52452087402344, 42.4073486328125, 47.2901725769043, 52.17300033569336, 57.05582809448242, 61.93865203857422, 66.82147979736328, 71.70430755615234]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 6.0, 6.0, 11.0, 14.0, 17.0, 11.0, 20.0, 22.0, 18.0, 19.0, 27.0, 19.0, 25.0, 35.0, 32.0, 39.0, 37.0, 36.0, 35.0, 33.0, 32.0, 31.0, 34.0, 44.0, 40.0, 35.0, 33.0, 40.0, 29.0, 29.0, 23.0, 16.0, 18.0, 13.0, 25.0, 11.0, 12.0, 15.0, 12.0, 4.0, 7.0, 3.0, 3.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.04292297363281, -33.971466064453125, -32.90000915527344, -31.82855224609375, -30.757097244262695, -29.685640335083008, -28.61418342590332, -27.542726516723633, -26.471271514892578, -25.39981460571289, -24.328357696533203, -23.256900787353516, -22.18544578552246, -21.113988876342773, -20.042531967163086, -18.9710750579834, -17.89961814880371, -16.828161239624023, -15.756705284118652, -14.685248374938965, -13.613792419433594, -12.542335510253906, -11.470878601074219, -10.399421691894531, -9.32796573638916, -8.256508827209473, -7.185052871704102, -6.113595962524414, -5.042139530181885, -3.9706830978393555, -2.899226188659668, -1.8277697563171387, -0.7563133239746094, 0.3151432275772095, 1.3865997791290283, 2.4580564498901367, 3.529512882232666, 4.600969314575195, 5.672426223754883, 6.743882656097412, 7.815339088439941, 8.886795997619629, 9.958251953125, 11.029708862304688, 12.101165771484375, 13.172621726989746, 14.244078636169434, 15.315534591674805, 16.386991500854492, 17.45844841003418, 18.529905319213867, 19.601360321044922, 20.67281723022461, 21.744274139404297, 22.815731048583984, 23.887187957763672, 24.95864486694336, 26.030101776123047, 27.101558685302734, 28.173015594482422, 29.244470596313477, 30.315927505493164, 31.38738441467285, 32.458839416503906, 33.530296325683594]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 9.0, 4.0, 6.0, 8.0, 9.0, 8.0, 17.0, 11.0, 14.0, 22.0, 25.0, 25.0, 24.0, 35.0, 31.0, 32.0, 46.0, 34.0, 50.0, 32.0, 35.0, 41.0, 39.0, 38.0, 37.0, 44.0, 28.0, 30.0, 24.0, 30.0, 28.0, 23.0, 18.0, 15.0, 14.0, 23.0, 14.0, 14.0, 12.0, 12.0, 9.0, 2.0, 6.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.859375, -4.6976318359375, -4.535888671875, -4.3741455078125, -4.21240234375, -4.0506591796875, -3.888916015625, -3.7271728515625, -3.5654296875, -3.4036865234375, -3.241943359375, -3.0802001953125, -2.91845703125, -2.7567138671875, -2.594970703125, -2.4332275390625, -2.271484375, -2.1097412109375, -1.947998046875, -1.7862548828125, -1.62451171875, -1.4627685546875, -1.301025390625, -1.1392822265625, -0.9775390625, -0.8157958984375, -0.654052734375, -0.4923095703125, -0.33056640625, -0.1688232421875, -0.007080078125, 0.1546630859375, 0.31640625, 0.4781494140625, 0.639892578125, 0.8016357421875, 0.96337890625, 1.1251220703125, 1.286865234375, 1.4486083984375, 1.6103515625, 1.7720947265625, 1.933837890625, 2.0955810546875, 2.25732421875, 2.4190673828125, 2.580810546875, 2.7425537109375, 2.904296875, 3.0660400390625, 3.227783203125, 3.3895263671875, 3.55126953125, 3.7130126953125, 3.874755859375, 4.0364990234375, 4.1982421875, 4.3599853515625, 4.521728515625, 4.6834716796875, 4.84521484375, 5.0069580078125, 5.168701171875, 5.3304443359375, 5.4921875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 10.0, 14.0, 19.0, 41.0, 57.0, 101.0, 113.0, 166.0, 231.0, 354.0, 569.0, 818.0, 1181.0, 1793.0, 2692.0, 3967.0, 5945.0, 9086.0, 13553.0, 21704.0, 34028.0, 54335.0, 86947.0, 133184.0, 177578.0, 168415.0, 120149.0, 77083.0, 48248.0, 30137.0, 19304.0, 12282.0, 8118.0, 5440.0, 3488.0, 2456.0, 1597.0, 1056.0, 771.0, 516.0, 328.0, 222.0, 148.0, 108.0, 66.0, 43.0, 35.0, 23.0, 15.0, 11.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.54541015625, -0.5282974243164062, -0.5111846923828125, -0.49407196044921875, -0.476959228515625, -0.45984649658203125, -0.4427337646484375, -0.42562103271484375, -0.40850830078125, -0.39139556884765625, -0.3742828369140625, -0.35717010498046875, -0.340057373046875, -0.32294464111328125, -0.3058319091796875, -0.28871917724609375, -0.2716064453125, -0.25449371337890625, -0.2373809814453125, -0.22026824951171875, -0.203155517578125, -0.18604278564453125, -0.1689300537109375, -0.15181732177734375, -0.13470458984375, -0.11759185791015625, -0.1004791259765625, -0.08336639404296875, -0.066253662109375, -0.04914093017578125, -0.0320281982421875, -0.01491546630859375, 0.002197265625, 0.01930999755859375, 0.0364227294921875, 0.05353546142578125, 0.070648193359375, 0.08776092529296875, 0.1048736572265625, 0.12198638916015625, 0.13909912109375, 0.15621185302734375, 0.1733245849609375, 0.19043731689453125, 0.207550048828125, 0.22466278076171875, 0.2417755126953125, 0.25888824462890625, 0.2760009765625, 0.29311370849609375, 0.3102264404296875, 0.32733917236328125, 0.344451904296875, 0.36156463623046875, 0.3786773681640625, 0.39579010009765625, 0.41290283203125, 0.43001556396484375, 0.4471282958984375, 0.46424102783203125, 0.481353759765625, 0.49846649169921875, 0.5155792236328125, 0.5326919555664062, 0.5498046875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 9.0, 8.0, 13.0, 11.0, 7.0, 22.0, 15.0, 22.0, 17.0, 18.0, 31.0, 35.0, 26.0, 41.0, 42.0, 35.0, 42.0, 36.0, 24.0, 1064.0, 41.0, 29.0, 35.0, 37.0, 39.0, 47.0, 43.0, 27.0, 30.0, 22.0, 24.0, 33.0, 17.0, 17.0, 14.0, 12.0, 15.0, 9.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.953125, -3.839752197265625, -3.72637939453125, -3.613006591796875, -3.4996337890625, -3.386260986328125, -3.27288818359375, -3.159515380859375, -3.046142578125, -2.932769775390625, -2.81939697265625, -2.706024169921875, -2.5926513671875, -2.479278564453125, -2.36590576171875, -2.252532958984375, -2.13916015625, -2.025787353515625, -1.91241455078125, -1.799041748046875, -1.6856689453125, -1.572296142578125, -1.45892333984375, -1.345550537109375, -1.232177734375, -1.118804931640625, -1.00543212890625, -0.892059326171875, -0.7786865234375, -0.665313720703125, -0.55194091796875, -0.438568115234375, -0.3251953125, -0.211822509765625, -0.09844970703125, 0.014923095703125, 0.1282958984375, 0.241668701171875, 0.35504150390625, 0.468414306640625, 0.581787109375, 0.695159912109375, 0.80853271484375, 0.921905517578125, 1.0352783203125, 1.148651123046875, 1.26202392578125, 1.375396728515625, 1.48876953125, 1.602142333984375, 1.71551513671875, 1.828887939453125, 1.9422607421875, 2.055633544921875, 2.16900634765625, 2.282379150390625, 2.395751953125, 2.509124755859375, 2.62249755859375, 2.735870361328125, 2.8492431640625, 2.962615966796875, 3.07598876953125, 3.189361572265625, 3.302734375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 2.0, 5.0, 12.0, 17.0, 38.0, 33.0, 69.0, 104.0, 152.0, 249.0, 368.0, 558.0, 920.0, 1468.0, 2330.0, 3840.0, 6241.0, 10632.0, 17437.0, 29616.0, 50414.0, 87917.0, 140425.0, 1226280.0, 190720.0, 132013.0, 80833.0, 46950.0, 26997.0, 15782.0, 9542.0, 5852.0, 3560.0, 2112.0, 1352.0, 823.0, 518.0, 327.0, 205.0, 137.0, 102.0, 58.0, 35.0, 33.0, 18.0, 15.0, 9.0, 8.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.464111328125, -0.44910430908203125, -0.4340972900390625, -0.41909027099609375, -0.404083251953125, -0.38907623291015625, -0.3740692138671875, -0.35906219482421875, -0.34405517578125, -0.32904815673828125, -0.3140411376953125, -0.29903411865234375, -0.284027099609375, -0.26902008056640625, -0.2540130615234375, -0.23900604248046875, -0.2239990234375, -0.20899200439453125, -0.1939849853515625, -0.17897796630859375, -0.163970947265625, -0.14896392822265625, -0.1339569091796875, -0.11894989013671875, -0.10394287109375, -0.08893585205078125, -0.0739288330078125, -0.05892181396484375, -0.043914794921875, -0.02890777587890625, -0.0139007568359375, 0.00110626220703125, 0.01611328125, 0.03112030029296875, 0.0461273193359375, 0.06113433837890625, 0.076141357421875, 0.09114837646484375, 0.1061553955078125, 0.12116241455078125, 0.13616943359375, 0.15117645263671875, 0.1661834716796875, 0.18119049072265625, 0.196197509765625, 0.21120452880859375, 0.2262115478515625, 0.24121856689453125, 0.2562255859375, 0.27123260498046875, 0.2862396240234375, 0.30124664306640625, 0.316253662109375, 0.33126068115234375, 0.3462677001953125, 0.36127471923828125, 0.37628173828125, 0.39128875732421875, 0.4062957763671875, 0.42130279541015625, 0.436309814453125, 0.45131683349609375, 0.4663238525390625, 0.48133087158203125, 0.496337890625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 6.0, 10.0, 11.0, 14.0, 19.0, 25.0, 25.0, 26.0, 38.0, 54.0, 81.0, 71.0, 78.0, 71.0, 89.0, 60.0, 80.0, 51.0, 41.0, 34.0, 32.0, 25.0, 17.0, 15.0, 7.0, 4.0, 5.0, 5.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002246856689453125, -0.0021757185459136963, -0.0021045804023742676, -0.002033442258834839, -0.00196230411529541, -0.0018911659717559814, -0.0018200278282165527, -0.001748889684677124, -0.0016777515411376953, -0.0016066133975982666, -0.0015354752540588379, -0.0014643371105194092, -0.0013931989669799805, -0.0013220608234405518, -0.001250922679901123, -0.0011797845363616943, -0.0011086463928222656, -0.001037508249282837, -0.0009663701057434082, -0.0008952319622039795, -0.0008240938186645508, -0.0007529556751251221, -0.0006818175315856934, -0.0006106793880462646, -0.0005395412445068359, -0.0004684031009674072, -0.0003972649574279785, -0.0003261268138885498, -0.0002549886703491211, -0.00018385052680969238, -0.00011271238327026367, -4.157423973083496e-05, 2.956390380859375e-05, 0.00010070204734802246, 0.00017184019088745117, 0.00024297833442687988, 0.0003141164779663086, 0.0003852546215057373, 0.000456392765045166, 0.0005275309085845947, 0.0005986690521240234, 0.0006698071956634521, 0.0007409453392028809, 0.0008120834827423096, 0.0008832216262817383, 0.000954359769821167, 0.0010254979133605957, 0.0010966360569000244, 0.0011677742004394531, 0.0012389123439788818, 0.0013100504875183105, 0.0013811886310577393, 0.001452326774597168, 0.0015234649181365967, 0.0015946030616760254, 0.001665741205215454, 0.0017368793487548828, 0.0018080174922943115, 0.0018791556358337402, 0.001950293779373169, 0.0020214319229125977, 0.0020925700664520264, 0.002163708209991455, 0.002234846353530884, 0.0023059844970703125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 7.0, 4.0, 8.0, 13.0, 14.0, 21.0, 36.0, 38.0, 55.0, 89.0, 140.0, 237.0, 532.0, 11808.0, 1032062.0, 2498.0, 414.0, 198.0, 103.0, 76.0, 58.0, 32.0, 33.0, 23.0, 16.0, 14.0, 11.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049835205078125, -0.048295021057128906, -0.04675483703613281, -0.04521465301513672, -0.043674468994140625, -0.04213428497314453, -0.04059410095214844, -0.039053916931152344, -0.03751373291015625, -0.035973548889160156, -0.03443336486816406, -0.03289318084716797, -0.031352996826171875, -0.02981281280517578, -0.028272628784179688, -0.026732444763183594, -0.0251922607421875, -0.023652076721191406, -0.022111892700195312, -0.02057170867919922, -0.019031524658203125, -0.01749134063720703, -0.015951156616210938, -0.014410972595214844, -0.01287078857421875, -0.011330604553222656, -0.009790420532226562, -0.008250236511230469, -0.006710052490234375, -0.005169868469238281, -0.0036296844482421875, -0.0020895004272460938, -0.00054931640625, 0.0009908676147460938, 0.0025310516357421875, 0.004071235656738281, 0.005611419677734375, 0.007151603698730469, 0.008691787719726562, 0.010231971740722656, 0.01177215576171875, 0.013312339782714844, 0.014852523803710938, 0.01639270782470703, 0.017932891845703125, 0.01947307586669922, 0.021013259887695312, 0.022553443908691406, 0.0240936279296875, 0.025633811950683594, 0.027173995971679688, 0.02871417999267578, 0.030254364013671875, 0.03179454803466797, 0.03333473205566406, 0.034874916076660156, 0.03641510009765625, 0.037955284118652344, 0.03949546813964844, 0.04103565216064453, 0.042575836181640625, 0.04411602020263672, 0.04565620422363281, 0.047196388244628906, 0.048736572265625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 6.0, 20.0, 31.0, 69.0, 85.0, 117.0, 156.0, 145.0, 138.0, 89.0, 59.0, 32.0, 29.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010949239367619157, -0.0010528148850426078, -0.0010107058333232999, -0.0009685968398116529, -0.000926487788092345, -0.0008843787363730371, -0.0008422697428613901, -0.0008001606911420822, -0.0007580516394227743, -0.0007159425877034664, -0.0006738335359841585, -0.0006317245424725115, -0.0005896154907532036, -0.0005475064390338957, -0.0005053974455222487, -0.00046328839380294085, -0.00042117934208363295, -0.00037907029036432505, -0.0003369612677488476, -0.00029485224513337016, -0.00025274319341406226, -0.0002106341562466696, -0.00016852511907927692, -0.00012641609646379948, -8.430704474449158e-05, -4.2198007577098906e-05, -8.897040970623493e-08, 4.2020066757686436e-05, 8.412910392507911e-05, 0.00012623814109247178, 0.00016834717825986445, 0.0002104562008753419, 0.0002525653690099716, 0.0002946744207292795, 0.00033678344334475696, 0.0003788924659602344, 0.0004210015176795423, 0.0004631105693988502, 0.0005052195629104972, 0.0005473286146298051, 0.000589437666349113, 0.0006315467180684209, 0.0006736557697877288, 0.0007157647632993758, 0.0007578738150186837, 0.0007999828667379916, 0.0008420918602496386, 0.0008842009119689465, 0.0009263099636882544, 0.0009684190154075623, 0.0010105280671268702, 0.001052637118846178, 0.001094746170565486, 0.001136855105869472, 0.00117896415758878, 0.0012210732093080878, 0.0012631822610273957, 0.0013052913127467036, 0.0013474003644660115, 0.0013895094161853194, 0.0014316183514893055, 0.0014737274032086134, 0.0015158364549279213, 0.0015579455066472292, 0.001600054558366537]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 7.0, 8.0, 9.0, 12.0, 20.0, 12.0, 10.0, 18.0, 17.0, 29.0, 22.0, 21.0, 32.0, 40.0, 39.0, 36.0, 34.0, 31.0, 39.0, 27.0, 47.0, 50.0, 38.0, 40.0, 49.0, 25.0, 35.0, 31.0, 28.0, 27.0, 30.0, 20.0, 13.0, 19.0, 15.0, 17.0, 6.0, 4.0, 4.0, 9.0, 9.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007822513580322266, -0.0007548760622739792, -0.0007275007665157318, -0.0007001254707574844, -0.0006727501749992371, -0.0006453748792409897, -0.0006179995834827423, -0.0005906242877244949, -0.0005632489919662476, -0.0005358736962080002, -0.0005084984004497528, -0.00048112310469150543, -0.00045374780893325806, -0.0004263725131750107, -0.0003989972174167633, -0.00037162192165851593, -0.00034424662590026855, -0.0003168713301420212, -0.0002894960343837738, -0.00026212073862552643, -0.00023474544286727905, -0.00020737014710903168, -0.0001799948513507843, -0.00015261955559253693, -0.00012524425983428955, -9.786896407604218e-05, -7.04936683177948e-05, -4.3118372559547424e-05, -1.574307680130005e-05, 1.1632218956947327e-05, 3.90075147151947e-05, 6.638281047344208e-05, 9.375810623168945e-05, 0.00012113340198993683, 0.0001485086977481842, 0.00017588399350643158, 0.00020325928926467896, 0.00023063458502292633, 0.0002580098807811737, 0.0002853851765394211, 0.00031276047229766846, 0.00034013576805591583, 0.0003675110638141632, 0.0003948863595724106, 0.00042226165533065796, 0.00044963695108890533, 0.0004770122468471527, 0.0005043875426054001, 0.0005317628383636475, 0.0005591381341218948, 0.0005865134298801422, 0.0006138887256383896, 0.000641264021396637, 0.0006686393171548843, 0.0006960146129131317, 0.0007233899086713791, 0.0007507652044296265, 0.0007781405001878738, 0.0008055157959461212, 0.0008328910917043686, 0.000860266387462616, 0.0008876416832208633, 0.0009150169789791107, 0.0009423922747373581, 0.0009697675704956055]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 9.0, 4.0, 6.0, 8.0, 9.0, 8.0, 17.0, 11.0, 14.0, 22.0, 25.0, 25.0, 24.0, 35.0, 31.0, 32.0, 46.0, 34.0, 50.0, 32.0, 34.0, 42.0, 39.0, 38.0, 37.0, 44.0, 28.0, 30.0, 24.0, 30.0, 28.0, 23.0, 18.0, 15.0, 14.0, 23.0, 14.0, 14.0, 12.0, 12.0, 9.0, 2.0, 6.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.859375, -4.6976318359375, -4.535888671875, -4.3741455078125, -4.21240234375, -4.0506591796875, -3.888916015625, -3.7271728515625, -3.5654296875, -3.4036865234375, -3.241943359375, -3.0802001953125, -2.91845703125, -2.7567138671875, -2.594970703125, -2.4332275390625, -2.271484375, -2.1097412109375, -1.947998046875, -1.7862548828125, -1.62451171875, -1.4627685546875, -1.301025390625, -1.1392822265625, -0.9775390625, -0.8157958984375, -0.654052734375, -0.4923095703125, -0.33056640625, -0.1688232421875, -0.007080078125, 0.1546630859375, 0.31640625, 0.4781494140625, 0.639892578125, 0.8016357421875, 0.96337890625, 1.1251220703125, 1.286865234375, 1.4486083984375, 1.6103515625, 1.7720947265625, 1.933837890625, 2.0955810546875, 2.25732421875, 2.4190673828125, 2.580810546875, 2.7425537109375, 2.904296875, 3.0660400390625, 3.227783203125, 3.3895263671875, 3.55126953125, 3.7130126953125, 3.874755859375, 4.0364990234375, 4.1982421875, 4.3599853515625, 4.521728515625, 4.6834716796875, 4.84521484375, 5.0069580078125, 5.168701171875, 5.3304443359375, 5.4921875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 9.0, 12.0, 14.0, 25.0, 47.0, 72.0, 116.0, 167.0, 294.0, 542.0, 906.0, 1717.0, 3442.0, 6723.0, 13185.0, 27565.0, 60855.0, 145021.0, 355765.0, 247301.0, 100155.0, 43205.0, 20677.0, 10041.0, 5022.0, 2556.0, 1365.0, 703.0, 410.0, 213.0, 153.0, 94.0, 53.0, 34.0, 22.0, 16.0, 10.0, 4.0, 8.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.4375, -4.30218505859375, -4.1668701171875, -4.03155517578125, -3.896240234375, -3.76092529296875, -3.6256103515625, -3.49029541015625, -3.35498046875, -3.21966552734375, -3.0843505859375, -2.94903564453125, -2.813720703125, -2.67840576171875, -2.5430908203125, -2.40777587890625, -2.2724609375, -2.13714599609375, -2.0018310546875, -1.86651611328125, -1.731201171875, -1.59588623046875, -1.4605712890625, -1.32525634765625, -1.18994140625, -1.05462646484375, -0.9193115234375, -0.78399658203125, -0.648681640625, -0.51336669921875, -0.3780517578125, -0.24273681640625, -0.107421875, 0.02789306640625, 0.1632080078125, 0.29852294921875, 0.433837890625, 0.56915283203125, 0.7044677734375, 0.83978271484375, 0.97509765625, 1.11041259765625, 1.2457275390625, 1.38104248046875, 1.516357421875, 1.65167236328125, 1.7869873046875, 1.92230224609375, 2.0576171875, 2.19293212890625, 2.3282470703125, 2.46356201171875, 2.598876953125, 2.73419189453125, 2.8695068359375, 3.00482177734375, 3.14013671875, 3.27545166015625, 3.4107666015625, 3.54608154296875, 3.681396484375, 3.81671142578125, 3.9520263671875, 4.08734130859375, 4.22265625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 8.0, 8.0, 8.0, 15.0, 21.0, 15.0, 32.0, 34.0, 38.0, 42.0, 29.0, 46.0, 52.0, 77.0, 119.0, 378.0, 1547.0, 127.0, 72.0, 60.0, 39.0, 39.0, 38.0, 37.0, 25.0, 28.0, 23.0, 20.0, 15.0, 13.0, 9.0, 7.0, 9.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.15625, -24.458251953125, -23.76025390625, -23.062255859375, -22.3642578125, -21.666259765625, -20.96826171875, -20.270263671875, -19.572265625, -18.874267578125, -18.17626953125, -17.478271484375, -16.7802734375, -16.082275390625, -15.38427734375, -14.686279296875, -13.98828125, -13.290283203125, -12.59228515625, -11.894287109375, -11.1962890625, -10.498291015625, -9.80029296875, -9.102294921875, -8.404296875, -7.706298828125, -7.00830078125, -6.310302734375, -5.6123046875, -4.914306640625, -4.21630859375, -3.518310546875, -2.8203125, -2.122314453125, -1.42431640625, -0.726318359375, -0.0283203125, 0.669677734375, 1.36767578125, 2.065673828125, 2.763671875, 3.461669921875, 4.15966796875, 4.857666015625, 5.5556640625, 6.253662109375, 6.95166015625, 7.649658203125, 8.34765625, 9.045654296875, 9.74365234375, 10.441650390625, 11.1396484375, 11.837646484375, 12.53564453125, 13.233642578125, 13.931640625, 14.629638671875, 15.32763671875, 16.025634765625, 16.7236328125, 17.421630859375, 18.11962890625, 18.817626953125, 19.515625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 5.0, 9.0, 9.0, 15.0, 15.0, 19.0, 23.0, 39.0, 39.0, 74.0, 81.0, 125.0, 171.0, 253.0, 346.0, 888.0, 10930.0, 3099927.0, 30191.0, 1181.0, 438.0, 251.0, 173.0, 145.0, 82.0, 74.0, 53.0, 44.0, 25.0, 19.0, 13.0, 15.0, 11.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.9375, -51.20703125, -49.4765625, -47.74609375, -46.015625, -44.28515625, -42.5546875, -40.82421875, -39.09375, -37.36328125, -35.6328125, -33.90234375, -32.171875, -30.44140625, -28.7109375, -26.98046875, -25.25, -23.51953125, -21.7890625, -20.05859375, -18.328125, -16.59765625, -14.8671875, -13.13671875, -11.40625, -9.67578125, -7.9453125, -6.21484375, -4.484375, -2.75390625, -1.0234375, 0.70703125, 2.4375, 4.16796875, 5.8984375, 7.62890625, 9.359375, 11.08984375, 12.8203125, 14.55078125, 16.28125, 18.01171875, 19.7421875, 21.47265625, 23.203125, 24.93359375, 26.6640625, 28.39453125, 30.125, 31.85546875, 33.5859375, 35.31640625, 37.046875, 38.77734375, 40.5078125, 42.23828125, 43.96875, 45.69921875, 47.4296875, 49.16015625, 50.890625, 52.62109375, 54.3515625, 56.08203125, 57.8125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 25.0, 267.0, 566.0, 147.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.9264678955078, -152.76657104492188, -149.606689453125, -146.44679260253906, -143.28689575195312, -140.1269989013672, -136.96710205078125, -133.80722045898438, -130.64732360839844, -127.4874267578125, -124.3275375366211, -121.16764831542969, -118.00775146484375, -114.84785461425781, -111.6879653930664, -108.528076171875, -105.36817932128906, -102.20828247070312, -99.04839324951172, -95.88850402832031, -92.72860717773438, -89.56871032714844, -86.40882110595703, -83.24893188476562, -80.08903503417969, -76.92913818359375, -73.76924896240234, -70.60935974121094, -67.449462890625, -64.28956604003906, -61.129676818847656, -57.969783782958984, -54.80989456176758, -51.650001525878906, -48.490108489990234, -45.33021545410156, -42.17032241821289, -39.01042938232422, -35.85053634643555, -32.690643310546875, -29.530750274658203, -26.37085723876953, -23.21096420288086, -20.051071166992188, -16.891178131103516, -13.731285095214844, -10.571392059326172, -7.4114990234375, -4.251605987548828, -1.0917129516601562, 2.0681800842285156, 5.2280731201171875, 8.38796615600586, 11.547859191894531, 14.707752227783203, 17.867645263671875, 21.027538299560547, 24.18743133544922, 27.34732437133789, 30.507217407226562, 33.667110443115234, 36.827003479003906, 39.98689651489258, 43.14678955078125, 46.30668258666992]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 4.0, 1.0, 6.0, 7.0, 10.0, 9.0, 15.0, 20.0, 9.0, 15.0, 25.0, 21.0, 35.0, 27.0, 41.0, 35.0, 34.0, 39.0, 34.0, 36.0, 35.0, 36.0, 46.0, 26.0, 41.0, 42.0, 35.0, 34.0, 30.0, 28.0, 37.0, 27.0, 17.0, 17.0, 19.0, 10.0, 21.0, 14.0, 9.0, 10.0, 12.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-41.557090759277344, -40.16460418701172, -38.772117614746094, -37.379634857177734, -35.98714828491211, -34.594661712646484, -33.20217514038086, -31.809690475463867, -30.417205810546875, -29.02471923828125, -27.632234573364258, -26.239748001098633, -24.84726333618164, -23.454776763916016, -22.06229019165039, -20.6698055267334, -19.277318954467773, -17.88483238220215, -16.492347717285156, -15.099861145019531, -13.707376480102539, -12.314889907836914, -10.922404289245605, -9.529918670654297, -8.137433052062988, -6.74494743347168, -5.352461814880371, -3.9599757194519043, -2.5674901008605957, -1.175004482269287, 0.2174816131591797, 1.6099672317504883, 3.002452850341797, 4.3949384689331055, 5.787424087524414, 7.179910182952881, 8.572395324707031, 9.964881896972656, 11.357367515563965, 12.749853134155273, 14.142338752746582, 15.53482437133789, 16.927310943603516, 18.319795608520508, 19.712282180786133, 21.104766845703125, 22.49725341796875, 23.889739990234375, 25.282224655151367, 26.674711227416992, 28.067195892333984, 29.45968246459961, 30.8521671295166, 32.244651794433594, 33.63713836669922, 35.029624938964844, 36.42211151123047, 37.814598083496094, 39.20708465576172, 40.59956741333008, 41.9920539855957, 43.38454055786133, 44.77702713012695, 46.16950988769531, 47.56199645996094]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 7.0, 2.0, 3.0, 3.0, 8.0, 12.0, 12.0, 11.0, 10.0, 13.0, 23.0, 22.0, 22.0, 25.0, 36.0, 40.0, 39.0, 40.0, 36.0, 35.0, 30.0, 48.0, 37.0, 36.0, 36.0, 44.0, 36.0, 38.0, 30.0, 32.0, 25.0, 15.0, 29.0, 21.0, 19.0, 12.0, 25.0, 15.0, 8.0, 12.0, 9.0, 14.0, 2.0, 8.0, 5.0, 1.0, 6.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.00390625, -4.83209228515625, -4.6602783203125, -4.48846435546875, -4.316650390625, -4.14483642578125, -3.9730224609375, -3.80120849609375, -3.62939453125, -3.45758056640625, -3.2857666015625, -3.11395263671875, -2.942138671875, -2.77032470703125, -2.5985107421875, -2.42669677734375, -2.2548828125, -2.08306884765625, -1.9112548828125, -1.73944091796875, -1.567626953125, -1.39581298828125, -1.2239990234375, -1.05218505859375, -0.88037109375, -0.70855712890625, -0.5367431640625, -0.36492919921875, -0.193115234375, -0.02130126953125, 0.1505126953125, 0.32232666015625, 0.494140625, 0.66595458984375, 0.8377685546875, 1.00958251953125, 1.181396484375, 1.35321044921875, 1.5250244140625, 1.69683837890625, 1.86865234375, 2.04046630859375, 2.2122802734375, 2.38409423828125, 2.555908203125, 2.72772216796875, 2.8995361328125, 3.07135009765625, 3.2431640625, 3.41497802734375, 3.5867919921875, 3.75860595703125, 3.930419921875, 4.10223388671875, 4.2740478515625, 4.44586181640625, 4.61767578125, 4.78948974609375, 4.9613037109375, 5.13311767578125, 5.304931640625, 5.47674560546875, 5.6485595703125, 5.82037353515625, 5.9921875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 6.0, 5.0, 14.0, 11.0, 16.0, 11.0, 24.0, 30.0, 25.0, 42.0, 39.0, 70.0, 127.0, 237.0, 568.0, 1657.0, 7861.0, 94360.0, 1989567.0, 2003021.0, 86607.0, 7240.0, 1545.0, 517.0, 231.0, 116.0, 58.0, 49.0, 41.0, 30.0, 21.0, 17.0, 23.0, 13.0, 10.0, 9.0, 8.0, 11.0, 6.0, 5.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.8125, -16.232666015625, -15.65283203125, -15.072998046875, -14.4931640625, -13.913330078125, -13.33349609375, -12.753662109375, -12.173828125, -11.593994140625, -11.01416015625, -10.434326171875, -9.8544921875, -9.274658203125, -8.69482421875, -8.114990234375, -7.53515625, -6.955322265625, -6.37548828125, -5.795654296875, -5.2158203125, -4.635986328125, -4.05615234375, -3.476318359375, -2.896484375, -2.316650390625, -1.73681640625, -1.156982421875, -0.5771484375, 0.002685546875, 0.58251953125, 1.162353515625, 1.7421875, 2.322021484375, 2.90185546875, 3.481689453125, 4.0615234375, 4.641357421875, 5.22119140625, 5.801025390625, 6.380859375, 6.960693359375, 7.54052734375, 8.120361328125, 8.7001953125, 9.280029296875, 9.85986328125, 10.439697265625, 11.01953125, 11.599365234375, 12.17919921875, 12.759033203125, 13.3388671875, 13.918701171875, 14.49853515625, 15.078369140625, 15.658203125, 16.238037109375, 16.81787109375, 17.397705078125, 17.9775390625, 18.557373046875, 19.13720703125, 19.717041015625, 20.296875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 0.0, 3.0, 5.0, 3.0, 6.0, 8.0, 11.0, 16.0, 9.0, 24.0, 33.0, 43.0, 56.0, 67.0, 85.0, 114.0, 119.0, 180.0, 190.0, 273.0, 331.0, 376.0, 415.0, 360.0, 294.0, 254.0, 189.0, 149.0, 121.0, 83.0, 64.0, 45.0, 27.0, 25.0, 26.0, 14.0, 17.0, 12.0, 10.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.578125, -9.2606201171875, -8.943115234375, -8.6256103515625, -8.30810546875, -7.9906005859375, -7.673095703125, -7.3555908203125, -7.0380859375, -6.7205810546875, -6.403076171875, -6.0855712890625, -5.76806640625, -5.4505615234375, -5.133056640625, -4.8155517578125, -4.498046875, -4.1805419921875, -3.863037109375, -3.5455322265625, -3.22802734375, -2.9105224609375, -2.593017578125, -2.2755126953125, -1.9580078125, -1.6405029296875, -1.322998046875, -1.0054931640625, -0.68798828125, -0.3704833984375, -0.052978515625, 0.2645263671875, 0.58203125, 0.8995361328125, 1.217041015625, 1.5345458984375, 1.85205078125, 2.1695556640625, 2.487060546875, 2.8045654296875, 3.1220703125, 3.4395751953125, 3.757080078125, 4.0745849609375, 4.39208984375, 4.7095947265625, 5.027099609375, 5.3446044921875, 5.662109375, 5.9796142578125, 6.297119140625, 6.6146240234375, 6.93212890625, 7.2496337890625, 7.567138671875, 7.8846435546875, 8.2021484375, 8.5196533203125, 8.837158203125, 9.1546630859375, 9.47216796875, 9.7896728515625, 10.107177734375, 10.4246826171875, 10.7421875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 10.0, 10.0, 21.0, 19.0, 20.0, 43.0, 33.0, 59.0, 69.0, 83.0, 136.0, 176.0, 236.0, 290.0, 419.0, 1103.0, 15217.0, 3177819.0, 989973.0, 6206.0, 761.0, 353.0, 271.0, 202.0, 157.0, 151.0, 102.0, 79.0, 65.0, 44.0, 33.0, 27.0, 22.0, 16.0, 15.0, 7.0, 11.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-49.375, -47.87353515625, -46.3720703125, -44.87060546875, -43.369140625, -41.86767578125, -40.3662109375, -38.86474609375, -37.36328125, -35.86181640625, -34.3603515625, -32.85888671875, -31.357421875, -29.85595703125, -28.3544921875, -26.85302734375, -25.3515625, -23.85009765625, -22.3486328125, -20.84716796875, -19.345703125, -17.84423828125, -16.3427734375, -14.84130859375, -13.33984375, -11.83837890625, -10.3369140625, -8.83544921875, -7.333984375, -5.83251953125, -4.3310546875, -2.82958984375, -1.328125, 0.17333984375, 1.6748046875, 3.17626953125, 4.677734375, 6.17919921875, 7.6806640625, 9.18212890625, 10.68359375, 12.18505859375, 13.6865234375, 15.18798828125, 16.689453125, 18.19091796875, 19.6923828125, 21.19384765625, 22.6953125, 24.19677734375, 25.6982421875, 27.19970703125, 28.701171875, 30.20263671875, 31.7041015625, 33.20556640625, 34.70703125, 36.20849609375, 37.7099609375, 39.21142578125, 40.712890625, 42.21435546875, 43.7158203125, 45.21728515625, 46.71875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 11.0, 15.0, 23.0, 44.0, 81.0, 90.0, 97.0, 110.0, 111.0, 112.0, 89.0, 68.0, 50.0, 35.0, 27.0, 20.0, 12.0, 3.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.89492797851562, -65.3831558227539, -63.87138748168945, -62.359619140625, -60.84785079956055, -59.336082458496094, -57.824310302734375, -56.31254196166992, -54.80077362060547, -53.289005279541016, -51.7772331237793, -50.265464782714844, -48.75369644165039, -47.24192810058594, -45.73015594482422, -44.218387603759766, -42.70661544799805, -41.194847106933594, -39.683074951171875, -38.17130661010742, -36.65953826904297, -35.14776611328125, -33.6359977722168, -32.124229431152344, -30.612459182739258, -29.100688934326172, -27.58892059326172, -26.077150344848633, -24.565380096435547, -23.053611755371094, -21.541841506958008, -20.030071258544922, -18.518306732177734, -17.00653648376465, -15.494768142700195, -13.98299789428711, -12.47122859954834, -10.95945930480957, -9.447689056396484, -7.935919761657715, -6.424150466918945, -4.912381172180176, -3.400611400604248, -1.8888416290283203, -0.3770723342895508, 1.1346969604492188, 2.6464672088623047, 4.158236503601074, 5.670005798339844, 7.181775093078613, 8.693544387817383, 10.205314636230469, 11.717083930969238, 13.228853225708008, 14.740623474121094, 16.252391815185547, 17.764162063598633, 19.27593231201172, 20.787700653076172, 22.299470901489258, 23.811241149902344, 25.323009490966797, 26.834779739379883, 28.34654998779297, 29.858318328857422]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 5.0, 8.0, 6.0, 10.0, 14.0, 19.0, 20.0, 16.0, 22.0, 33.0, 34.0, 26.0, 31.0, 48.0, 38.0, 49.0, 49.0, 36.0, 53.0, 44.0, 45.0, 29.0, 49.0, 42.0, 49.0, 38.0, 22.0, 34.0, 23.0, 23.0, 16.0, 16.0, 17.0, 14.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.432861328125, -41.165992736816406, -39.89912414550781, -38.63225555419922, -37.365386962890625, -36.09851837158203, -34.83164978027344, -33.56478500366211, -32.297916412353516, -31.031047821044922, -29.764179229736328, -28.497310638427734, -27.230443954467773, -25.96357536315918, -24.696706771850586, -23.429840087890625, -22.1629695892334, -20.896100997924805, -19.62923240661621, -18.36236572265625, -17.095497131347656, -15.828628540039062, -14.561759948730469, -13.294892311096191, -12.028023719787598, -10.761155128479004, -9.494287490844727, -8.227418899536133, -6.960550785064697, -5.693682670593262, -4.426814079284668, -3.1599464416503906, -1.8930778503417969, -0.6262096166610718, 0.6406586170196533, 1.907526969909668, 3.1743950843811035, 4.441263198852539, 5.708131790161133, 6.97499942779541, 8.241868019104004, 9.508736610412598, 10.775604248046875, 12.042472839355469, 13.309341430664062, 14.57620906829834, 15.843077659606934, 17.10994529724121, 18.376813888549805, 19.6436824798584, 20.910551071166992, 22.177417755126953, 23.444286346435547, 24.71115493774414, 25.978023529052734, 27.244892120361328, 28.511760711669922, 29.778629302978516, 31.04549789428711, 32.3123664855957, 33.5792350769043, 34.846099853515625, 36.11296844482422, 37.37983703613281, 38.646705627441406]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 8.0, 7.0, 4.0, 5.0, 12.0, 13.0, 12.0, 20.0, 20.0, 21.0, 19.0, 23.0, 31.0, 41.0, 32.0, 40.0, 48.0, 48.0, 47.0, 42.0, 39.0, 33.0, 38.0, 38.0, 50.0, 37.0, 39.0, 41.0, 31.0, 17.0, 21.0, 21.0, 16.0, 14.0, 12.0, 19.0, 13.0, 7.0, 4.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5625, -5.368896484375, -5.17529296875, -4.981689453125, -4.7880859375, -4.594482421875, -4.40087890625, -4.207275390625, -4.013671875, -3.820068359375, -3.62646484375, -3.432861328125, -3.2392578125, -3.045654296875, -2.85205078125, -2.658447265625, -2.46484375, -2.271240234375, -2.07763671875, -1.884033203125, -1.6904296875, -1.496826171875, -1.30322265625, -1.109619140625, -0.916015625, -0.722412109375, -0.52880859375, -0.335205078125, -0.1416015625, 0.052001953125, 0.24560546875, 0.439208984375, 0.6328125, 0.826416015625, 1.02001953125, 1.213623046875, 1.4072265625, 1.600830078125, 1.79443359375, 1.988037109375, 2.181640625, 2.375244140625, 2.56884765625, 2.762451171875, 2.9560546875, 3.149658203125, 3.34326171875, 3.536865234375, 3.73046875, 3.924072265625, 4.11767578125, 4.311279296875, 4.5048828125, 4.698486328125, 4.89208984375, 5.085693359375, 5.279296875, 5.472900390625, 5.66650390625, 5.860107421875, 6.0537109375, 6.247314453125, 6.44091796875, 6.634521484375, 6.828125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 7.0, 6.0, 10.0, 21.0, 35.0, 47.0, 70.0, 111.0, 176.0, 284.0, 396.0, 537.0, 712.0, 992.0, 1452.0, 1996.0, 2907.0, 4023.0, 5838.0, 8179.0, 11893.0, 16777.0, 25118.0, 37921.0, 56728.0, 85364.0, 123093.0, 159067.0, 151779.0, 114521.0, 77385.0, 51808.0, 34398.0, 22963.0, 15911.0, 10539.0, 7409.0, 5138.0, 3853.0, 2641.0, 1908.0, 1409.0, 978.0, 701.0, 500.0, 331.0, 223.0, 159.0, 100.0, 60.0, 34.0, 21.0, 14.0, 11.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.462890625, -0.4479026794433594, -0.43291473388671875, -0.4179267883300781, -0.4029388427734375, -0.3879508972167969, -0.37296295166015625, -0.3579750061035156, -0.342987060546875, -0.3279991149902344, -0.31301116943359375, -0.2980232238769531, -0.2830352783203125, -0.2680473327636719, -0.25305938720703125, -0.23807144165039062, -0.22308349609375, -0.20809555053710938, -0.19310760498046875, -0.17811965942382812, -0.1631317138671875, -0.14814376831054688, -0.13315582275390625, -0.11816787719726562, -0.103179931640625, -0.08819198608398438, -0.07320404052734375, -0.058216094970703125, -0.0432281494140625, -0.028240203857421875, -0.01325225830078125, 0.001735687255859375, 0.0167236328125, 0.031711578369140625, 0.04669952392578125, 0.061687469482421875, 0.0766754150390625, 0.09166336059570312, 0.10665130615234375, 0.12163925170898438, 0.136627197265625, 0.15161514282226562, 0.16660308837890625, 0.18159103393554688, 0.1965789794921875, 0.21156692504882812, 0.22655487060546875, 0.24154281616210938, 0.25653076171875, 0.2715187072753906, 0.28650665283203125, 0.3014945983886719, 0.3164825439453125, 0.3314704895019531, 0.34645843505859375, 0.3614463806152344, 0.376434326171875, 0.3914222717285156, 0.40641021728515625, 0.4213981628417969, 0.4363861083984375, 0.4513740539550781, 0.46636199951171875, 0.4813499450683594, 0.496337890625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 0.0, 5.0, 14.0, 3.0, 13.0, 23.0, 19.0, 11.0, 14.0, 20.0, 22.0, 34.0, 25.0, 30.0, 28.0, 33.0, 46.0, 45.0, 50.0, 39.0, 1068.0, 43.0, 48.0, 33.0, 52.0, 37.0, 26.0, 42.0, 32.0, 25.0, 22.0, 21.0, 23.0, 20.0, 16.0, 9.0, 12.0, 10.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.921875, -3.801544189453125, -3.68121337890625, -3.560882568359375, -3.4405517578125, -3.320220947265625, -3.19989013671875, -3.079559326171875, -2.959228515625, -2.838897705078125, -2.71856689453125, -2.598236083984375, -2.4779052734375, -2.357574462890625, -2.23724365234375, -2.116912841796875, -1.99658203125, -1.876251220703125, -1.75592041015625, -1.635589599609375, -1.5152587890625, -1.394927978515625, -1.27459716796875, -1.154266357421875, -1.033935546875, -0.913604736328125, -0.79327392578125, -0.672943115234375, -0.5526123046875, -0.432281494140625, -0.31195068359375, -0.191619873046875, -0.0712890625, 0.049041748046875, 0.16937255859375, 0.289703369140625, 0.4100341796875, 0.530364990234375, 0.65069580078125, 0.771026611328125, 0.891357421875, 1.011688232421875, 1.13201904296875, 1.252349853515625, 1.3726806640625, 1.493011474609375, 1.61334228515625, 1.733673095703125, 1.85400390625, 1.974334716796875, 2.09466552734375, 2.214996337890625, 2.3353271484375, 2.455657958984375, 2.57598876953125, 2.696319580078125, 2.816650390625, 2.936981201171875, 3.05731201171875, 3.177642822265625, 3.2979736328125, 3.418304443359375, 3.53863525390625, 3.658966064453125, 3.779296875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 15.0, 5.0, 20.0, 23.0, 35.0, 51.0, 81.0, 135.0, 167.0, 306.0, 461.0, 690.0, 993.0, 1725.0, 2671.0, 4385.0, 6999.0, 11315.0, 18677.0, 31039.0, 51568.0, 86258.0, 134615.0, 1079756.0, 320367.0, 132429.0, 84643.0, 50672.0, 29871.0, 17811.0, 10972.0, 6802.0, 4199.0, 2680.0, 1696.0, 1031.0, 694.0, 442.0, 287.0, 181.0, 123.0, 90.0, 60.0, 35.0, 19.0, 14.0, 12.0, 5.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.454833984375, -0.4401512145996094, -0.42546844482421875, -0.4107856750488281, -0.3961029052734375, -0.3814201354980469, -0.36673736572265625, -0.3520545959472656, -0.337371826171875, -0.3226890563964844, -0.30800628662109375, -0.2933235168457031, -0.2786407470703125, -0.2639579772949219, -0.24927520751953125, -0.23459243774414062, -0.21990966796875, -0.20522689819335938, -0.19054412841796875, -0.17586135864257812, -0.1611785888671875, -0.14649581909179688, -0.13181304931640625, -0.11713027954101562, -0.102447509765625, -0.08776473999023438, -0.07308197021484375, -0.058399200439453125, -0.0437164306640625, -0.029033660888671875, -0.01435089111328125, 0.000331878662109375, 0.0150146484375, 0.029697418212890625, 0.04438018798828125, 0.059062957763671875, 0.0737457275390625, 0.08842849731445312, 0.10311126708984375, 0.11779403686523438, 0.132476806640625, 0.14715957641601562, 0.16184234619140625, 0.17652511596679688, 0.1912078857421875, 0.20589065551757812, 0.22057342529296875, 0.23525619506835938, 0.24993896484375, 0.2646217346191406, 0.27930450439453125, 0.2939872741699219, 0.3086700439453125, 0.3233528137207031, 0.33803558349609375, 0.3527183532714844, 0.367401123046875, 0.3820838928222656, 0.39676666259765625, 0.4114494323730469, 0.4261322021484375, 0.4408149719238281, 0.45549774169921875, 0.4701805114746094, 0.48486328125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 3.0, 8.0, 9.0, 15.0, 11.0, 17.0, 24.0, 16.0, 20.0, 35.0, 24.0, 32.0, 44.0, 44.0, 62.0, 51.0, 52.0, 52.0, 71.0, 55.0, 52.0, 40.0, 45.0, 41.0, 29.0, 24.0, 18.0, 20.0, 20.0, 13.0, 6.0, 7.0, 9.0, 9.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00136566162109375, -0.0013147294521331787, -0.0012637972831726074, -0.0012128651142120361, -0.0011619329452514648, -0.0011110007762908936, -0.0010600686073303223, -0.001009136438369751, -0.0009582042694091797, -0.0009072721004486084, -0.0008563399314880371, -0.0008054077625274658, -0.0007544755935668945, -0.0007035434246063232, -0.000652611255645752, -0.0006016790866851807, -0.0005507469177246094, -0.0004998147487640381, -0.0004488825798034668, -0.0003979504108428955, -0.0003470182418823242, -0.00029608607292175293, -0.00024515390396118164, -0.00019422173500061035, -0.00014328956604003906, -9.235739707946777e-05, -4.1425228118896484e-05, 9.506940841674805e-06, 6.0439109802246094e-05, 0.00011137127876281738, 0.00016230344772338867, 0.00021323561668395996, 0.00026416778564453125, 0.00031509995460510254, 0.00036603212356567383, 0.0004169642925262451, 0.0004678964614868164, 0.0005188286304473877, 0.000569760799407959, 0.0006206929683685303, 0.0006716251373291016, 0.0007225573062896729, 0.0007734894752502441, 0.0008244216442108154, 0.0008753538131713867, 0.000926285982131958, 0.0009772181510925293, 0.0010281503200531006, 0.0010790824890136719, 0.0011300146579742432, 0.0011809468269348145, 0.0012318789958953857, 0.001282811164855957, 0.0013337433338165283, 0.0013846755027770996, 0.001435607671737671, 0.0014865398406982422, 0.0015374720096588135, 0.0015884041786193848, 0.001639336347579956, 0.0016902685165405273, 0.0017412006855010986, 0.00179213285446167, 0.0018430650234222412, 0.0018939971923828125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 5.0, 11.0, 11.0, 9.0, 13.0, 14.0, 17.0, 26.0, 31.0, 33.0, 52.0, 69.0, 82.0, 99.0, 155.0, 261.0, 656.0, 5288.0, 993884.0, 45901.0, 968.0, 341.0, 161.0, 102.0, 80.0, 58.0, 43.0, 29.0, 34.0, 21.0, 28.0, 18.0, 8.0, 10.0, 15.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.039031982421875, -0.037967681884765625, -0.03690338134765625, -0.035839080810546875, -0.0347747802734375, -0.033710479736328125, -0.03264617919921875, -0.031581878662109375, -0.030517578125, -0.029453277587890625, -0.02838897705078125, -0.027324676513671875, -0.0262603759765625, -0.025196075439453125, -0.02413177490234375, -0.023067474365234375, -0.022003173828125, -0.020938873291015625, -0.01987457275390625, -0.018810272216796875, -0.0177459716796875, -0.016681671142578125, -0.01561737060546875, -0.014553070068359375, -0.01348876953125, -0.012424468994140625, -0.01136016845703125, -0.010295867919921875, -0.0092315673828125, -0.008167266845703125, -0.00710296630859375, -0.006038665771484375, -0.004974365234375, -0.003910064697265625, -0.00284576416015625, -0.001781463623046875, -0.0007171630859375, 0.000347137451171875, 0.00141143798828125, 0.002475738525390625, 0.0035400390625, 0.004604339599609375, 0.00566864013671875, 0.006732940673828125, 0.0077972412109375, 0.008861541748046875, 0.00992584228515625, 0.010990142822265625, 0.012054443359375, 0.013118743896484375, 0.01418304443359375, 0.015247344970703125, 0.0163116455078125, 0.017375946044921875, 0.01844024658203125, 0.019504547119140625, 0.02056884765625, 0.021633148193359375, 0.02269744873046875, 0.023761749267578125, 0.0248260498046875, 0.025890350341796875, 0.02695465087890625, 0.028018951416015625, 0.029083251953125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 94.0, 301.0, 422.0, 161.0, 24.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021073613315820694, -0.0019686666782945395, -0.0018299721414223313, -0.0016912776045501232, -0.0015525829512625933, -0.0014138884143903852, -0.001275193877518177, -0.001136499224230647, -0.000997804687358439, -0.0008591100922785699, -0.0007204154971987009, -0.0005817209603264928, -0.00044302636524662375, -0.0003043317701667547, -0.0001656372332945466, -2.6942638214677572e-05, 0.00011175195686519146, 0.0002504465519450605, 0.00038914111792109907, 0.0005278356838971376, 0.0006665302789770067, 0.0008052248740568757, 0.0009439194109290838, 0.0010826140642166138, 0.0012213086010888219, 0.00136000313796103, 0.00149869779124856, 0.001637392328120768, 0.0017760868649929762, 0.0019147815182805061, 0.0020534759387373924, 0.0021921705920249224, 0.0023308652453124523, 0.0024695598985999823, 0.0026082543190568686, 0.0027469489723443985, 0.0028856436256319284, 0.0030243382789194584, 0.0031630326993763447, 0.0033017273526638746, 0.0034404220059514046, 0.0035791166592389345, 0.003717811079695821, 0.0038565057329833508, 0.003995200153440237, 0.004133895039558411, 0.004272589460015297, 0.004411283880472183, 0.0045499783009290695, 0.004688672721385956, 0.004827367607504129, 0.004966062027961016, 0.005104756448417902, 0.005243451334536076, 0.005382145754992962, 0.005520840175449848, 0.005659535061568022, 0.005798229482024908, 0.005936924368143082, 0.006075618788599968, 0.006214313209056854, 0.006353008095175028, 0.006491702515631914, 0.0066303969360888, 0.006769091822206974]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 5.0, 9.0, 3.0, 9.0, 8.0, 13.0, 15.0, 15.0, 17.0, 22.0, 26.0, 28.0, 26.0, 30.0, 32.0, 39.0, 40.0, 34.0, 39.0, 44.0, 53.0, 46.0, 37.0, 39.0, 40.0, 42.0, 31.0, 27.0, 27.0, 25.0, 29.0, 30.0, 25.0, 18.0, 19.0, 10.0, 9.0, 7.0, 8.0, 7.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007494688034057617, -0.0007223617285490036, -0.0006952546536922455, -0.0006681475788354874, -0.0006410405039787292, -0.0006139334291219711, -0.000586826354265213, -0.0005597192794084549, -0.0005326122045516968, -0.0005055051296949387, -0.00047839805483818054, -0.0004512909799814224, -0.0004241839051246643, -0.0003970768302679062, -0.00036996975541114807, -0.00034286268055438995, -0.00031575560569763184, -0.0002886485308408737, -0.0002615414559841156, -0.00023443438112735748, -0.00020732730627059937, -0.00018022023141384125, -0.00015311315655708313, -0.000126006081700325, -9.88990068435669e-05, -7.179193198680878e-05, -4.468485713005066e-05, -1.757778227329254e-05, 9.529292583465576e-06, 3.6636367440223694e-05, 6.374344229698181e-05, 9.085051715373993e-05, 0.00011795759201049805, 0.00014506466686725616, 0.00017217174172401428, 0.0001992788165807724, 0.00022638589143753052, 0.00025349296629428864, 0.00028060004115104675, 0.00030770711600780487, 0.000334814190864563, 0.0003619212657213211, 0.0003890283405780792, 0.00041613541543483734, 0.00044324249029159546, 0.0004703495651483536, 0.0004974566400051117, 0.0005245637148618698, 0.0005516707897186279, 0.000578777864575386, 0.0006058849394321442, 0.0006329920142889023, 0.0006600990891456604, 0.0006872061640024185, 0.0007143132388591766, 0.0007414203137159348, 0.0007685273885726929, 0.000795634463429451, 0.0008227415382862091, 0.0008498486131429672, 0.0008769556879997253, 0.0009040627628564835, 0.0009311698377132416, 0.0009582769125699997, 0.0009853839874267578]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 8.0, 7.0, 4.0, 5.0, 12.0, 13.0, 12.0, 20.0, 20.0, 21.0, 19.0, 23.0, 31.0, 41.0, 32.0, 40.0, 48.0, 48.0, 47.0, 42.0, 39.0, 33.0, 38.0, 38.0, 50.0, 37.0, 39.0, 41.0, 31.0, 17.0, 21.0, 21.0, 16.0, 14.0, 12.0, 19.0, 13.0, 7.0, 4.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5625, -5.368896484375, -5.17529296875, -4.981689453125, -4.7880859375, -4.594482421875, -4.40087890625, -4.207275390625, -4.013671875, -3.820068359375, -3.62646484375, -3.432861328125, -3.2392578125, -3.045654296875, -2.85205078125, -2.658447265625, -2.46484375, -2.271240234375, -2.07763671875, -1.884033203125, -1.6904296875, -1.496826171875, -1.30322265625, -1.109619140625, -0.916015625, -0.722412109375, -0.52880859375, -0.335205078125, -0.1416015625, 0.052001953125, 0.24560546875, 0.439208984375, 0.6328125, 0.826416015625, 1.02001953125, 1.213623046875, 1.4072265625, 1.600830078125, 1.79443359375, 1.988037109375, 2.181640625, 2.375244140625, 2.56884765625, 2.762451171875, 2.9560546875, 3.149658203125, 3.34326171875, 3.536865234375, 3.73046875, 3.924072265625, 4.11767578125, 4.311279296875, 4.5048828125, 4.698486328125, 4.89208984375, 5.085693359375, 5.279296875, 5.472900390625, 5.66650390625, 5.860107421875, 6.0537109375, 6.247314453125, 6.44091796875, 6.634521484375, 6.828125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 12.0, 27.0, 18.0, 34.0, 37.0, 39.0, 79.0, 81.0, 111.0, 146.0, 231.0, 394.0, 881.0, 1842.0, 4880.0, 12511.0, 34234.0, 96643.0, 308190.0, 397191.0, 122133.0, 42673.0, 15499.0, 5885.0, 2364.0, 1026.0, 488.0, 265.0, 159.0, 87.0, 87.0, 68.0, 39.0, 44.0, 27.0, 25.0, 18.0, 13.0, 16.0, 12.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.796875, -5.61053466796875, -5.4241943359375, -5.23785400390625, -5.051513671875, -4.86517333984375, -4.6788330078125, -4.49249267578125, -4.30615234375, -4.11981201171875, -3.9334716796875, -3.74713134765625, -3.560791015625, -3.37445068359375, -3.1881103515625, -3.00177001953125, -2.8154296875, -2.62908935546875, -2.4427490234375, -2.25640869140625, -2.070068359375, -1.88372802734375, -1.6973876953125, -1.51104736328125, -1.32470703125, -1.13836669921875, -0.9520263671875, -0.76568603515625, -0.579345703125, -0.39300537109375, -0.2066650390625, -0.02032470703125, 0.166015625, 0.35235595703125, 0.5386962890625, 0.72503662109375, 0.911376953125, 1.09771728515625, 1.2840576171875, 1.47039794921875, 1.65673828125, 1.84307861328125, 2.0294189453125, 2.21575927734375, 2.402099609375, 2.58843994140625, 2.7747802734375, 2.96112060546875, 3.1474609375, 3.33380126953125, 3.5201416015625, 3.70648193359375, 3.892822265625, 4.07916259765625, 4.2655029296875, 4.45184326171875, 4.63818359375, 4.82452392578125, 5.0108642578125, 5.19720458984375, 5.383544921875, 5.56988525390625, 5.7562255859375, 5.94256591796875, 6.12890625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 2.0, 1.0, 8.0, 6.0, 8.0, 10.0, 13.0, 11.0, 17.0, 21.0, 22.0, 34.0, 25.0, 37.0, 53.0, 45.0, 61.0, 63.0, 78.0, 345.0, 1576.0, 167.0, 48.0, 70.0, 41.0, 36.0, 35.0, 34.0, 31.0, 17.0, 27.0, 21.0, 17.0, 16.0, 11.0, 11.0, 7.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.65625, -21.00439453125, -20.3525390625, -19.70068359375, -19.048828125, -18.39697265625, -17.7451171875, -17.09326171875, -16.44140625, -15.78955078125, -15.1376953125, -14.48583984375, -13.833984375, -13.18212890625, -12.5302734375, -11.87841796875, -11.2265625, -10.57470703125, -9.9228515625, -9.27099609375, -8.619140625, -7.96728515625, -7.3154296875, -6.66357421875, -6.01171875, -5.35986328125, -4.7080078125, -4.05615234375, -3.404296875, -2.75244140625, -2.1005859375, -1.44873046875, -0.796875, -0.14501953125, 0.5068359375, 1.15869140625, 1.810546875, 2.46240234375, 3.1142578125, 3.76611328125, 4.41796875, 5.06982421875, 5.7216796875, 6.37353515625, 7.025390625, 7.67724609375, 8.3291015625, 8.98095703125, 9.6328125, 10.28466796875, 10.9365234375, 11.58837890625, 12.240234375, 12.89208984375, 13.5439453125, 14.19580078125, 14.84765625, 15.49951171875, 16.1513671875, 16.80322265625, 17.455078125, 18.10693359375, 18.7587890625, 19.41064453125, 20.0625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 11.0, 5.0, 4.0, 5.0, 5.0, 11.0, 13.0, 12.0, 16.0, 27.0, 29.0, 34.0, 28.0, 48.0, 54.0, 75.0, 106.0, 131.0, 176.0, 320.0, 559.0, 1230.0, 8405.0, 2930686.0, 198406.0, 2968.0, 831.0, 467.0, 280.0, 174.0, 120.0, 100.0, 75.0, 40.0, 55.0, 45.0, 30.0, 22.0, 16.0, 13.0, 14.0, 11.0, 9.0, 11.0, 7.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.09375, -39.759765625, -38.42578125, -37.091796875, -35.7578125, -34.423828125, -33.08984375, -31.755859375, -30.421875, -29.087890625, -27.75390625, -26.419921875, -25.0859375, -23.751953125, -22.41796875, -21.083984375, -19.75, -18.416015625, -17.08203125, -15.748046875, -14.4140625, -13.080078125, -11.74609375, -10.412109375, -9.078125, -7.744140625, -6.41015625, -5.076171875, -3.7421875, -2.408203125, -1.07421875, 0.259765625, 1.59375, 2.927734375, 4.26171875, 5.595703125, 6.9296875, 8.263671875, 9.59765625, 10.931640625, 12.265625, 13.599609375, 14.93359375, 16.267578125, 17.6015625, 18.935546875, 20.26953125, 21.603515625, 22.9375, 24.271484375, 25.60546875, 26.939453125, 28.2734375, 29.607421875, 30.94140625, 32.275390625, 33.609375, 34.943359375, 36.27734375, 37.611328125, 38.9453125, 40.279296875, 41.61328125, 42.947265625, 44.28125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [2.0, 17.0, 555.0, 435.0, 11.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.344505310058594, -9.471978187561035, -4.599451065063477, 0.27307605743408203, 5.145603179931641, 10.018131256103516, 14.890657424926758, 19.76318359375, 24.635711669921875, 29.50823974609375, 34.380767822265625, 39.253292083740234, 44.12582015991211, 48.998348236083984, 53.870872497558594, 58.74340057373047, 63.615928649902344, 68.48845672607422, 73.3609848022461, 78.23351287841797, 83.10603332519531, 87.97856140136719, 92.85108947753906, 97.72361755371094, 102.59614562988281, 107.46867370605469, 112.34120178222656, 117.21372985839844, 122.08625793457031, 126.95878601074219, 131.83131408691406, 136.70382690429688, 141.57635498046875, 146.44888305664062, 151.3214111328125, 156.19393920898438, 161.06646728515625, 165.93899536132812, 170.8115234375, 175.68405151367188, 180.55657958984375, 185.42910766601562, 190.3016357421875, 195.17416381835938, 200.04669189453125, 204.91921997070312, 209.791748046875, 214.66427612304688, 219.5367889404297, 224.40931701660156, 229.28184509277344, 234.1543731689453, 239.0269012451172, 243.89942932128906, 248.77195739746094, 253.64447021484375, 258.5169982910156, 263.3895263671875, 268.2620544433594, 273.13458251953125, 278.0071105957031, 282.879638671875, 287.7521667480469, 292.62469482421875, 297.4972229003906]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 11.0, 9.0, 5.0, 13.0, 13.0, 13.0, 13.0, 21.0, 10.0, 28.0, 23.0, 34.0, 35.0, 29.0, 32.0, 45.0, 37.0, 28.0, 24.0, 37.0, 40.0, 47.0, 35.0, 40.0, 36.0, 40.0, 30.0, 29.0, 30.0, 32.0, 26.0, 20.0, 17.0, 12.0, 18.0, 8.0, 12.0, 12.0, 8.0, 7.0, 8.0, 4.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-46.500328063964844, -45.11433410644531, -43.72834014892578, -42.342342376708984, -40.95634841918945, -39.57035446166992, -38.184356689453125, -36.798362731933594, -35.41236877441406, -34.02637481689453, -32.640380859375, -31.254383087158203, -29.868389129638672, -28.48239517211914, -27.096399307250977, -25.710403442382812, -24.32440948486328, -22.93841552734375, -21.552419662475586, -20.166423797607422, -18.78042984008789, -17.39443588256836, -16.008440017700195, -14.622445106506348, -13.2364501953125, -11.850455284118652, -10.464460372924805, -9.078465461730957, -7.692470550537109, -6.306475639343262, -4.920480728149414, -3.5344858169555664, -2.1484909057617188, -0.7624959945678711, 0.6234989166259766, 2.009493827819824, 3.395488739013672, 4.7814836502075195, 6.167478561401367, 7.553473472595215, 8.939468383789062, 10.32546329498291, 11.711458206176758, 13.097453117370605, 14.483448028564453, 15.8694429397583, 17.25543785095215, 18.641433715820312, 20.027427673339844, 21.413421630859375, 22.79941749572754, 24.185413360595703, 25.571407318115234, 26.957401275634766, 28.34339714050293, 29.729393005371094, 31.115386962890625, 32.501380920410156, 33.88737487792969, 35.273372650146484, 36.659366607666016, 38.04536056518555, 39.431358337402344, 40.817352294921875, 42.203346252441406]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 14.0, 11.0, 11.0, 17.0, 19.0, 11.0, 21.0, 33.0, 23.0, 27.0, 49.0, 46.0, 48.0, 36.0, 53.0, 38.0, 47.0, 53.0, 35.0, 43.0, 43.0, 38.0, 33.0, 32.0, 28.0, 27.0, 30.0, 23.0, 17.0, 9.0, 15.0, 14.0, 6.0, 7.0, 7.0, 11.0, 7.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1171875, -5.9052734375, -5.693359375, -5.4814453125, -5.26953125, -5.0576171875, -4.845703125, -4.6337890625, -4.421875, -4.2099609375, -3.998046875, -3.7861328125, -3.57421875, -3.3623046875, -3.150390625, -2.9384765625, -2.7265625, -2.5146484375, -2.302734375, -2.0908203125, -1.87890625, -1.6669921875, -1.455078125, -1.2431640625, -1.03125, -0.8193359375, -0.607421875, -0.3955078125, -0.18359375, 0.0283203125, 0.240234375, 0.4521484375, 0.6640625, 0.8759765625, 1.087890625, 1.2998046875, 1.51171875, 1.7236328125, 1.935546875, 2.1474609375, 2.359375, 2.5712890625, 2.783203125, 2.9951171875, 3.20703125, 3.4189453125, 3.630859375, 3.8427734375, 4.0546875, 4.2666015625, 4.478515625, 4.6904296875, 4.90234375, 5.1142578125, 5.326171875, 5.5380859375, 5.75, 5.9619140625, 6.173828125, 6.3857421875, 6.59765625, 6.8095703125, 7.021484375, 7.2333984375, 7.4453125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 5.0, 6.0, 8.0, 6.0, 8.0, 22.0, 13.0, 22.0, 23.0, 27.0, 37.0, 46.0, 82.0, 102.0, 171.0, 370.0, 936.0, 3976.0, 48332.0, 1864019.0, 2211957.0, 57651.0, 4502.0, 958.0, 379.0, 188.0, 106.0, 74.0, 53.0, 40.0, 32.0, 29.0, 21.0, 11.0, 16.0, 11.0, 7.0, 6.0, 7.0, 11.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.53125, -18.83447265625, -18.1376953125, -17.44091796875, -16.744140625, -16.04736328125, -15.3505859375, -14.65380859375, -13.95703125, -13.26025390625, -12.5634765625, -11.86669921875, -11.169921875, -10.47314453125, -9.7763671875, -9.07958984375, -8.3828125, -7.68603515625, -6.9892578125, -6.29248046875, -5.595703125, -4.89892578125, -4.2021484375, -3.50537109375, -2.80859375, -2.11181640625, -1.4150390625, -0.71826171875, -0.021484375, 0.67529296875, 1.3720703125, 2.06884765625, 2.765625, 3.46240234375, 4.1591796875, 4.85595703125, 5.552734375, 6.24951171875, 6.9462890625, 7.64306640625, 8.33984375, 9.03662109375, 9.7333984375, 10.43017578125, 11.126953125, 11.82373046875, 12.5205078125, 13.21728515625, 13.9140625, 14.61083984375, 15.3076171875, 16.00439453125, 16.701171875, 17.39794921875, 18.0947265625, 18.79150390625, 19.48828125, 20.18505859375, 20.8818359375, 21.57861328125, 22.275390625, 22.97216796875, 23.6689453125, 24.36572265625, 25.0625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 6.0, 7.0, 8.0, 11.0, 18.0, 25.0, 31.0, 41.0, 46.0, 84.0, 99.0, 132.0, 200.0, 278.0, 279.0, 405.0, 441.0, 381.0, 369.0, 302.0, 234.0, 147.0, 116.0, 104.0, 68.0, 48.0, 43.0, 35.0, 24.0, 22.0, 11.0, 10.0, 2.0, 3.0, 7.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6640625, -11.3092041015625, -10.954345703125, -10.5994873046875, -10.24462890625, -9.8897705078125, -9.534912109375, -9.1800537109375, -8.8251953125, -8.4703369140625, -8.115478515625, -7.7606201171875, -7.40576171875, -7.0509033203125, -6.696044921875, -6.3411865234375, -5.986328125, -5.6314697265625, -5.276611328125, -4.9217529296875, -4.56689453125, -4.2120361328125, -3.857177734375, -3.5023193359375, -3.1474609375, -2.7926025390625, -2.437744140625, -2.0828857421875, -1.72802734375, -1.3731689453125, -1.018310546875, -0.6634521484375, -0.30859375, 0.0462646484375, 0.401123046875, 0.7559814453125, 1.11083984375, 1.4656982421875, 1.820556640625, 2.1754150390625, 2.5302734375, 2.8851318359375, 3.239990234375, 3.5948486328125, 3.94970703125, 4.3045654296875, 4.659423828125, 5.0142822265625, 5.369140625, 5.7239990234375, 6.078857421875, 6.4337158203125, 6.78857421875, 7.1434326171875, 7.498291015625, 7.8531494140625, 8.2080078125, 8.5628662109375, 8.917724609375, 9.2725830078125, 9.62744140625, 9.9822998046875, 10.337158203125, 10.6920166015625, 11.046875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 5.0, 4.0, 5.0, 3.0, 12.0, 8.0, 17.0, 30.0, 28.0, 46.0, 69.0, 88.0, 103.0, 146.0, 165.0, 229.0, 356.0, 798.0, 7545.0, 1395960.0, 2775578.0, 10612.0, 986.0, 430.0, 283.0, 209.0, 152.0, 108.0, 87.0, 44.0, 49.0, 28.0, 26.0, 19.0, 10.0, 14.0, 5.0, 6.0, 1.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-59.03125, -57.13037109375, -55.2294921875, -53.32861328125, -51.427734375, -49.52685546875, -47.6259765625, -45.72509765625, -43.82421875, -41.92333984375, -40.0224609375, -38.12158203125, -36.220703125, -34.31982421875, -32.4189453125, -30.51806640625, -28.6171875, -26.71630859375, -24.8154296875, -22.91455078125, -21.013671875, -19.11279296875, -17.2119140625, -15.31103515625, -13.41015625, -11.50927734375, -9.6083984375, -7.70751953125, -5.806640625, -3.90576171875, -2.0048828125, -0.10400390625, 1.796875, 3.69775390625, 5.5986328125, 7.49951171875, 9.400390625, 11.30126953125, 13.2021484375, 15.10302734375, 17.00390625, 18.90478515625, 20.8056640625, 22.70654296875, 24.607421875, 26.50830078125, 28.4091796875, 30.31005859375, 32.2109375, 34.11181640625, 36.0126953125, 37.91357421875, 39.814453125, 41.71533203125, 43.6162109375, 45.51708984375, 47.41796875, 49.31884765625, 51.2197265625, 53.12060546875, 55.021484375, 56.92236328125, 58.8232421875, 60.72412109375, 62.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 7.0, 7.0, 17.0, 30.0, 69.0, 71.0, 99.0, 132.0, 125.0, 138.0, 107.0, 82.0, 53.0, 24.0, 11.0, 14.0, 10.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.42529296875, -65.57601165771484, -63.72673034667969, -61.87744903564453, -60.02817153930664, -58.178890228271484, -56.32960891723633, -54.48032760620117, -52.63105010986328, -50.781768798828125, -48.93248748779297, -47.08320617675781, -45.23392868041992, -43.384647369384766, -41.53536605834961, -39.68608474731445, -37.8368034362793, -35.98752212524414, -34.138240814208984, -32.288963317871094, -30.439682006835938, -28.59040069580078, -26.741119384765625, -24.89183807373047, -23.042558670043945, -21.19327735900879, -19.343997955322266, -17.49471664428711, -15.64543628692627, -13.79615592956543, -11.946874618530273, -10.097594261169434, -8.248313903808594, -6.399033546447754, -4.549752712249756, -2.700471878051758, -0.851191520690918, 0.9980888366699219, 2.847370147705078, 4.696650505065918, 6.545930862426758, 8.395211219787598, 10.244491577148438, 12.093772888183594, 13.943053245544434, 15.792333602905273, 17.64161491394043, 19.490894317626953, 21.34017562866211, 23.189456939697266, 25.03873634338379, 26.888017654418945, 28.73729705810547, 30.586578369140625, 32.43585968017578, 34.28514099121094, 36.134422302246094, 37.98370361328125, 39.832984924316406, 41.68226623535156, 43.53154373168945, 45.38082504272461, 47.230106353759766, 49.07938766479492, 50.92866516113281]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 7.0, 5.0, 9.0, 3.0, 13.0, 13.0, 17.0, 16.0, 16.0, 12.0, 23.0, 22.0, 27.0, 38.0, 35.0, 40.0, 38.0, 29.0, 37.0, 42.0, 49.0, 44.0, 33.0, 41.0, 35.0, 32.0, 31.0, 26.0, 28.0, 24.0, 28.0, 25.0, 22.0, 22.0, 10.0, 12.0, 14.0, 7.0, 14.0, 11.0, 13.0, 8.0, 8.0, 4.0, 3.0, 5.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-37.36811828613281, -36.15095520019531, -34.93379211425781, -33.71662902832031, -32.49946594238281, -31.282304763793945, -30.065143585205078, -28.847980499267578, -27.630817413330078, -26.413654327392578, -25.196491241455078, -23.97933006286621, -22.76216697692871, -21.54500389099121, -20.327842712402344, -19.110679626464844, -17.893516540527344, -16.676353454589844, -15.45919132232666, -14.242029190063477, -13.024866104125977, -11.807703018188477, -10.590540885925293, -9.37337875366211, -8.15621566772461, -6.939053058624268, -5.721890449523926, -4.504727840423584, -3.287565231323242, -2.0704026222229004, -0.8532400131225586, 0.363922119140625, 1.581085205078125, 2.798247814178467, 4.015410423278809, 5.23257303237915, 6.449735641479492, 7.666898250579834, 8.884060859680176, 10.10122299194336, 11.31838607788086, 12.53554916381836, 13.752711296081543, 14.969873428344727, 16.187036514282227, 17.404199600219727, 18.621360778808594, 19.838523864746094, 21.055686950683594, 22.272850036621094, 23.490013122558594, 24.70717430114746, 25.92433738708496, 27.14150047302246, 28.358661651611328, 29.575824737548828, 30.792987823486328, 32.01015090942383, 33.22731399536133, 34.44447708129883, 35.66163635253906, 36.87879943847656, 38.09596252441406, 39.31312561035156, 40.53028869628906]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 12.0, 14.0, 12.0, 10.0, 17.0, 20.0, 21.0, 26.0, 28.0, 33.0, 49.0, 41.0, 47.0, 42.0, 54.0, 45.0, 45.0, 42.0, 44.0, 43.0, 40.0, 40.0, 27.0, 44.0, 23.0, 31.0, 21.0, 25.0, 15.0, 13.0, 15.0, 11.0, 9.0, 13.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.015625, -5.790283203125, -5.56494140625, -5.339599609375, -5.1142578125, -4.888916015625, -4.66357421875, -4.438232421875, -4.212890625, -3.987548828125, -3.76220703125, -3.536865234375, -3.3115234375, -3.086181640625, -2.86083984375, -2.635498046875, -2.41015625, -2.184814453125, -1.95947265625, -1.734130859375, -1.5087890625, -1.283447265625, -1.05810546875, -0.832763671875, -0.607421875, -0.382080078125, -0.15673828125, 0.068603515625, 0.2939453125, 0.519287109375, 0.74462890625, 0.969970703125, 1.1953125, 1.420654296875, 1.64599609375, 1.871337890625, 2.0966796875, 2.322021484375, 2.54736328125, 2.772705078125, 2.998046875, 3.223388671875, 3.44873046875, 3.674072265625, 3.8994140625, 4.124755859375, 4.35009765625, 4.575439453125, 4.80078125, 5.026123046875, 5.25146484375, 5.476806640625, 5.7021484375, 5.927490234375, 6.15283203125, 6.378173828125, 6.603515625, 6.828857421875, 7.05419921875, 7.279541015625, 7.5048828125, 7.730224609375, 7.95556640625, 8.180908203125, 8.40625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 6.0, 18.0, 22.0, 51.0, 61.0, 74.0, 101.0, 172.0, 268.0, 400.0, 574.0, 934.0, 1418.0, 2021.0, 3301.0, 5314.0, 8177.0, 13258.0, 21158.0, 36297.0, 61375.0, 105485.0, 168471.0, 210565.0, 161880.0, 100259.0, 57931.0, 34395.0, 20320.0, 12428.0, 7862.0, 4960.0, 3126.0, 2036.0, 1295.0, 869.0, 526.0, 378.0, 242.0, 164.0, 114.0, 75.0, 62.0, 36.0, 19.0, 18.0, 14.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.671875, -0.6511688232421875, -0.630462646484375, -0.6097564697265625, -0.58905029296875, -0.5683441162109375, -0.547637939453125, -0.5269317626953125, -0.5062255859375, -0.4855194091796875, -0.464813232421875, -0.4441070556640625, -0.42340087890625, -0.4026947021484375, -0.381988525390625, -0.3612823486328125, -0.340576171875, -0.3198699951171875, -0.299163818359375, -0.2784576416015625, -0.25775146484375, -0.2370452880859375, -0.216339111328125, -0.1956329345703125, -0.1749267578125, -0.1542205810546875, -0.133514404296875, -0.1128082275390625, -0.09210205078125, -0.0713958740234375, -0.050689697265625, -0.0299835205078125, -0.00927734375, 0.0114288330078125, 0.032135009765625, 0.0528411865234375, 0.07354736328125, 0.0942535400390625, 0.114959716796875, 0.1356658935546875, 0.1563720703125, 0.1770782470703125, 0.197784423828125, 0.2184906005859375, 0.23919677734375, 0.2599029541015625, 0.280609130859375, 0.3013153076171875, 0.322021484375, 0.3427276611328125, 0.363433837890625, 0.3841400146484375, 0.40484619140625, 0.4255523681640625, 0.446258544921875, 0.4669647216796875, 0.4876708984375, 0.5083770751953125, 0.529083251953125, 0.5497894287109375, 0.57049560546875, 0.5912017822265625, 0.611907958984375, 0.6326141357421875, 0.6533203125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 7.0, 3.0, 6.0, 11.0, 8.0, 20.0, 13.0, 24.0, 19.0, 19.0, 19.0, 30.0, 40.0, 26.0, 41.0, 38.0, 44.0, 54.0, 48.0, 1066.0, 50.0, 48.0, 44.0, 35.0, 44.0, 31.0, 31.0, 24.0, 28.0, 30.0, 23.0, 21.0, 17.0, 9.0, 9.0, 9.0, 15.0, 4.0, 9.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.62109375, -4.475830078125, -4.33056640625, -4.185302734375, -4.0400390625, -3.894775390625, -3.74951171875, -3.604248046875, -3.458984375, -3.313720703125, -3.16845703125, -3.023193359375, -2.8779296875, -2.732666015625, -2.58740234375, -2.442138671875, -2.296875, -2.151611328125, -2.00634765625, -1.861083984375, -1.7158203125, -1.570556640625, -1.42529296875, -1.280029296875, -1.134765625, -0.989501953125, -0.84423828125, -0.698974609375, -0.5537109375, -0.408447265625, -0.26318359375, -0.117919921875, 0.02734375, 0.172607421875, 0.31787109375, 0.463134765625, 0.6083984375, 0.753662109375, 0.89892578125, 1.044189453125, 1.189453125, 1.334716796875, 1.47998046875, 1.625244140625, 1.7705078125, 1.915771484375, 2.06103515625, 2.206298828125, 2.3515625, 2.496826171875, 2.64208984375, 2.787353515625, 2.9326171875, 3.077880859375, 3.22314453125, 3.368408203125, 3.513671875, 3.658935546875, 3.80419921875, 3.949462890625, 4.0947265625, 4.239990234375, 4.38525390625, 4.530517578125, 4.67578125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 10.0, 7.0, 10.0, 17.0, 19.0, 30.0, 53.0, 84.0, 106.0, 194.0, 286.0, 480.0, 770.0, 1167.0, 1929.0, 3120.0, 5204.0, 8387.0, 14107.0, 23947.0, 40967.0, 72757.0, 124250.0, 180960.0, 1243686.0, 151337.0, 94182.0, 53911.0, 30426.0, 17659.0, 10658.0, 6270.0, 3860.0, 2400.0, 1405.0, 924.0, 577.0, 357.0, 215.0, 121.0, 101.0, 69.0, 37.0, 31.0, 18.0, 11.0, 9.0, 2.0, 2.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.49951171875, -0.482421875, -0.46533203125, -0.4482421875, -0.43115234375, -0.4140625, -0.39697265625, -0.3798828125, -0.36279296875, -0.345703125, -0.32861328125, -0.3115234375, -0.29443359375, -0.27734375, -0.26025390625, -0.2431640625, -0.22607421875, -0.208984375, -0.19189453125, -0.1748046875, -0.15771484375, -0.140625, -0.12353515625, -0.1064453125, -0.08935546875, -0.072265625, -0.05517578125, -0.0380859375, -0.02099609375, -0.00390625, 0.01318359375, 0.0302734375, 0.04736328125, 0.064453125, 0.08154296875, 0.0986328125, 0.11572265625, 0.1328125, 0.14990234375, 0.1669921875, 0.18408203125, 0.201171875, 0.21826171875, 0.2353515625, 0.25244140625, 0.26953125, 0.28662109375, 0.3037109375, 0.32080078125, 0.337890625, 0.35498046875, 0.3720703125, 0.38916015625, 0.40625, 0.42333984375, 0.4404296875, 0.45751953125, 0.474609375, 0.49169921875, 0.5087890625, 0.52587890625, 0.54296875, 0.56005859375, 0.5771484375, 0.59423828125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 5.0, 0.0, 5.0, 8.0, 11.0, 9.0, 13.0, 22.0, 15.0, 13.0, 27.0, 24.0, 37.0, 26.0, 39.0, 50.0, 38.0, 44.0, 51.0, 52.0, 60.0, 61.0, 47.0, 44.0, 45.0, 32.0, 29.0, 23.0, 35.0, 23.0, 19.0, 20.0, 13.0, 4.0, 9.0, 9.0, 7.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0021762847900390625, -0.0021111667156219482, -0.002046048641204834, -0.0019809305667877197, -0.0019158124923706055, -0.0018506944179534912, -0.001785576343536377, -0.0017204582691192627, -0.0016553401947021484, -0.0015902221202850342, -0.00152510404586792, -0.0014599859714508057, -0.0013948678970336914, -0.0013297498226165771, -0.0012646317481994629, -0.0011995136737823486, -0.0011343955993652344, -0.0010692775249481201, -0.0010041594505310059, -0.0009390413761138916, -0.0008739233016967773, -0.0008088052272796631, -0.0007436871528625488, -0.0006785690784454346, -0.0006134510040283203, -0.0005483329296112061, -0.0004832148551940918, -0.00041809678077697754, -0.0003529787063598633, -0.000287860631942749, -0.00022274255752563477, -0.0001576244831085205, -9.250640869140625e-05, -2.7388334274291992e-05, 3.7729740142822266e-05, 0.00010284781455993652, 0.00016796588897705078, 0.00023308396339416504, 0.0002982020378112793, 0.00036332011222839355, 0.0004284381866455078, 0.0004935562610626221, 0.0005586743354797363, 0.0006237924098968506, 0.0006889104843139648, 0.0007540285587310791, 0.0008191466331481934, 0.0008842647075653076, 0.0009493827819824219, 0.0010145008563995361, 0.0010796189308166504, 0.0011447370052337646, 0.001209855079650879, 0.0012749731540679932, 0.0013400912284851074, 0.0014052093029022217, 0.001470327377319336, 0.0015354454517364502, 0.0016005635261535645, 0.0016656816005706787, 0.001730799674987793, 0.0017959177494049072, 0.0018610358238220215, 0.0019261538982391357, 0.00199127197265625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 3.0, 8.0, 1.0, 19.0, 13.0, 12.0, 22.0, 27.0, 29.0, 36.0, 47.0, 57.0, 69.0, 84.0, 133.0, 199.0, 396.0, 1247.0, 106157.0, 935313.0, 3277.0, 566.0, 224.0, 152.0, 100.0, 67.0, 56.0, 50.0, 34.0, 28.0, 24.0, 23.0, 19.0, 10.0, 10.0, 7.0, 7.0, 5.0, 7.0, 8.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042572021484375, -0.04116249084472656, -0.039752960205078125, -0.03834342956542969, -0.03693389892578125, -0.03552436828613281, -0.034114837646484375, -0.03270530700683594, -0.0312957763671875, -0.029886245727539062, -0.028476715087890625, -0.027067184448242188, -0.02565765380859375, -0.024248123168945312, -0.022838592529296875, -0.021429061889648438, -0.02001953125, -0.018610000610351562, -0.017200469970703125, -0.015790939331054688, -0.01438140869140625, -0.012971878051757812, -0.011562347412109375, -0.010152816772460938, -0.0087432861328125, -0.0073337554931640625, -0.005924224853515625, -0.0045146942138671875, -0.00310516357421875, -0.0016956329345703125, -0.000286102294921875, 0.0011234283447265625, 0.002532958984375, 0.0039424896240234375, 0.005352020263671875, 0.0067615509033203125, 0.00817108154296875, 0.009580612182617188, 0.010990142822265625, 0.012399673461914062, 0.0138092041015625, 0.015218734741210938, 0.016628265380859375, 0.018037796020507812, 0.01944732666015625, 0.020856857299804688, 0.022266387939453125, 0.023675918579101562, 0.02508544921875, 0.026494979858398438, 0.027904510498046875, 0.029314041137695312, 0.03072357177734375, 0.03213310241699219, 0.033542633056640625, 0.03495216369628906, 0.0363616943359375, 0.03777122497558594, 0.039180755615234375, 0.04059028625488281, 0.04199981689453125, 0.04340934753417969, 0.044818878173828125, 0.04622840881347656, 0.047637939453125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 182.0, 793.0, 41.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02585594728589058, -0.025371214374899864, -0.02488648146390915, -0.024401746690273285, -0.02391701377928257, -0.023432280868291855, -0.02294754795730114, -0.022462815046310425, -0.02197808027267456, -0.021493347361683846, -0.02100861445069313, -0.020523879677057266, -0.02003914676606655, -0.019554413855075836, -0.01906968094408512, -0.018584948033094406, -0.018100213259458542, -0.017615480348467827, -0.017130747437477112, -0.016646012663841248, -0.016161279752850533, -0.015676546841859818, -0.015191813930869102, -0.014707080088555813, -0.014222348108887672, -0.013737615197896957, -0.013252881355583668, -0.012768148444592953, -0.012283414602279663, -0.011798681691288948, -0.011313948780298233, -0.010829214937984943, -0.010344480164349079, -0.009859747253358364, -0.009375013411045074, -0.00889028050005436, -0.00840554665774107, -0.007920813746750355, -0.007436080370098352, -0.00695134699344635, -0.006466613616794348, -0.005981880240142345, -0.005497146863490343, -0.005012413486838341, -0.004527680575847626, -0.004042946733534336, -0.003558213822543621, -0.0030734804458916187, -0.0025887470692396164, -0.002104013692587614, -0.0016192804323509336, -0.001134547172114253, -0.0006498137954622507, -0.00016508041881024837, 0.0003196527250111103, 0.0008043861016631126, 0.001289119478315115, 0.0017738528549671173, 0.0022585862316191196, 0.0027433193754404783, 0.0032280527520924807, 0.003712786128744483, 0.004197519272565842, 0.004682252649217844, 0.005166986025869846]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 5.0, 6.0, 6.0, 4.0, 7.0, 10.0, 10.0, 14.0, 18.0, 13.0, 25.0, 25.0, 24.0, 27.0, 24.0, 38.0, 25.0, 36.0, 33.0, 38.0, 38.0, 34.0, 37.0, 38.0, 55.0, 37.0, 32.0, 33.0, 43.0, 25.0, 31.0, 24.0, 36.0, 18.0, 22.0, 16.0, 26.0, 11.0, 13.0, 11.0, 7.0, 7.0, 2.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011115670204162598, -0.001074160449206829, -0.0010367538779973984, -0.0009993473067879677, -0.000961940735578537, -0.0009245341643691063, -0.0008871275931596756, -0.0008497210219502449, -0.0008123144507408142, -0.0007749078795313835, -0.0007375013083219528, -0.0007000947371125221, -0.0006626881659030914, -0.0006252815946936607, -0.00058787502348423, -0.0005504684522747993, -0.0005130618810653687, -0.00047565530985593796, -0.00043824873864650726, -0.00040084216743707657, -0.0003634355962276459, -0.0003260290250182152, -0.0002886224538087845, -0.0002512158825993538, -0.0002138093113899231, -0.0001764027401804924, -0.0001389961689710617, -0.00010158959776163101, -6.418302655220032e-05, -2.6776455342769623e-05, 1.0630115866661072e-05, 4.8036687076091766e-05, 8.544325828552246e-05, 0.00012284982949495316, 0.00016025640070438385, 0.00019766297191381454, 0.00023506954312324524, 0.00027247611433267593, 0.00030988268554210663, 0.0003472892567515373, 0.000384695827960968, 0.0004221023991703987, 0.0004595089703798294, 0.0004969155415892601, 0.0005343221127986908, 0.0005717286840081215, 0.0006091352552175522, 0.0006465418264269829, 0.0006839483976364136, 0.0007213549688458443, 0.000758761540055275, 0.0007961681112647057, 0.0008335746824741364, 0.000870981253683567, 0.0009083878248929977, 0.0009457943961024284, 0.0009832009673118591, 0.0010206075385212898, 0.0010580141097307205, 0.0010954206809401512, 0.001132827252149582, 0.0011702338233590126, 0.0012076403945684433, 0.001245046965777874, 0.0012824535369873047]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 12.0, 14.0, 12.0, 10.0, 17.0, 20.0, 21.0, 26.0, 28.0, 33.0, 49.0, 41.0, 47.0, 42.0, 54.0, 45.0, 45.0, 42.0, 44.0, 43.0, 40.0, 40.0, 27.0, 44.0, 23.0, 30.0, 22.0, 25.0, 15.0, 13.0, 15.0, 11.0, 9.0, 13.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.015625, -5.790283203125, -5.56494140625, -5.339599609375, -5.1142578125, -4.888916015625, -4.66357421875, -4.438232421875, -4.212890625, -3.987548828125, -3.76220703125, -3.536865234375, -3.3115234375, -3.086181640625, -2.86083984375, -2.635498046875, -2.41015625, -2.184814453125, -1.95947265625, -1.734130859375, -1.5087890625, -1.283447265625, -1.05810546875, -0.832763671875, -0.607421875, -0.382080078125, -0.15673828125, 0.068603515625, 0.2939453125, 0.519287109375, 0.74462890625, 0.969970703125, 1.1953125, 1.420654296875, 1.64599609375, 1.871337890625, 2.0966796875, 2.322021484375, 2.54736328125, 2.772705078125, 2.998046875, 3.223388671875, 3.44873046875, 3.674072265625, 3.8994140625, 4.124755859375, 4.35009765625, 4.575439453125, 4.80078125, 5.026123046875, 5.25146484375, 5.476806640625, 5.7021484375, 5.927490234375, 6.15283203125, 6.378173828125, 6.603515625, 6.828857421875, 7.05419921875, 7.279541015625, 7.5048828125, 7.730224609375, 7.95556640625, 8.180908203125, 8.40625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 9.0, 11.0, 19.0, 20.0, 23.0, 24.0, 42.0, 68.0, 76.0, 93.0, 150.0, 231.0, 369.0, 693.0, 1752.0, 7802.0, 50992.0, 613109.0, 331673.0, 32864.0, 5533.0, 1381.0, 578.0, 312.0, 231.0, 117.0, 90.0, 68.0, 57.0, 43.0, 19.0, 25.0, 16.0, 18.0, 15.0, 8.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.125, -10.7113037109375, -10.297607421875, -9.8839111328125, -9.47021484375, -9.0565185546875, -8.642822265625, -8.2291259765625, -7.8154296875, -7.4017333984375, -6.988037109375, -6.5743408203125, -6.16064453125, -5.7469482421875, -5.333251953125, -4.9195556640625, -4.505859375, -4.0921630859375, -3.678466796875, -3.2647705078125, -2.85107421875, -2.4373779296875, -2.023681640625, -1.6099853515625, -1.1962890625, -0.7825927734375, -0.368896484375, 0.0447998046875, 0.45849609375, 0.8721923828125, 1.285888671875, 1.6995849609375, 2.11328125, 2.5269775390625, 2.940673828125, 3.3543701171875, 3.76806640625, 4.1817626953125, 4.595458984375, 5.0091552734375, 5.4228515625, 5.8365478515625, 6.250244140625, 6.6639404296875, 7.07763671875, 7.4913330078125, 7.905029296875, 8.3187255859375, 8.732421875, 9.1461181640625, 9.559814453125, 9.9735107421875, 10.38720703125, 10.8009033203125, 11.214599609375, 11.6282958984375, 12.0419921875, 12.4556884765625, 12.869384765625, 13.2830810546875, 13.69677734375, 14.1104736328125, 14.524169921875, 14.9378662109375, 15.3515625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 10.0, 5.0, 17.0, 12.0, 17.0, 24.0, 25.0, 29.0, 37.0, 38.0, 49.0, 45.0, 63.0, 96.0, 1690.0, 362.0, 91.0, 64.0, 62.0, 55.0, 42.0, 26.0, 39.0, 28.0, 35.0, 21.0, 9.0, 13.0, 8.0, 6.0, 9.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.5625, -28.663818359375, -27.76513671875, -26.866455078125, -25.9677734375, -25.069091796875, -24.17041015625, -23.271728515625, -22.373046875, -21.474365234375, -20.57568359375, -19.677001953125, -18.7783203125, -17.879638671875, -16.98095703125, -16.082275390625, -15.18359375, -14.284912109375, -13.38623046875, -12.487548828125, -11.5888671875, -10.690185546875, -9.79150390625, -8.892822265625, -7.994140625, -7.095458984375, -6.19677734375, -5.298095703125, -4.3994140625, -3.500732421875, -2.60205078125, -1.703369140625, -0.8046875, 0.093994140625, 0.99267578125, 1.891357421875, 2.7900390625, 3.688720703125, 4.58740234375, 5.486083984375, 6.384765625, 7.283447265625, 8.18212890625, 9.080810546875, 9.9794921875, 10.878173828125, 11.77685546875, 12.675537109375, 13.57421875, 14.472900390625, 15.37158203125, 16.270263671875, 17.1689453125, 18.067626953125, 18.96630859375, 19.864990234375, 20.763671875, 21.662353515625, 22.56103515625, 23.459716796875, 24.3583984375, 25.257080078125, 26.15576171875, 27.054443359375, 27.953125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 9.0, 7.0, 12.0, 12.0, 19.0, 36.0, 39.0, 42.0, 36.0, 69.0, 102.0, 180.0, 377.0, 972.0, 209224.0, 2932270.0, 1332.0, 371.0, 180.0, 110.0, 69.0, 48.0, 37.0, 32.0, 27.0, 21.0, 13.0, 16.0, 9.0, 10.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.75, -82.0244140625, -79.298828125, -76.5732421875, -73.84765625, -71.1220703125, -68.396484375, -65.6708984375, -62.9453125, -60.2197265625, -57.494140625, -54.7685546875, -52.04296875, -49.3173828125, -46.591796875, -43.8662109375, -41.140625, -38.4150390625, -35.689453125, -32.9638671875, -30.23828125, -27.5126953125, -24.787109375, -22.0615234375, -19.3359375, -16.6103515625, -13.884765625, -11.1591796875, -8.43359375, -5.7080078125, -2.982421875, -0.2568359375, 2.46875, 5.1943359375, 7.919921875, 10.6455078125, 13.37109375, 16.0966796875, 18.822265625, 21.5478515625, 24.2734375, 26.9990234375, 29.724609375, 32.4501953125, 35.17578125, 37.9013671875, 40.626953125, 43.3525390625, 46.078125, 48.8037109375, 51.529296875, 54.2548828125, 56.98046875, 59.7060546875, 62.431640625, 65.1572265625, 67.8828125, 70.6083984375, 73.333984375, 76.0595703125, 78.78515625, 81.5107421875, 84.236328125, 86.9619140625, 89.6875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 301.0, 645.0, 62.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.72957611083984, -75.79257202148438, -71.8555679321289, -67.91856384277344, -63.9815673828125, -60.04456329345703, -56.10755920410156, -52.170555114746094, -48.23355484008789, -44.29655075073242, -40.35955047607422, -36.42254638671875, -32.48554229736328, -28.548542022705078, -24.61153793334961, -20.674535751342773, -16.737533569335938, -12.800531387329102, -8.86352825164795, -4.926525115966797, -0.9895229339599609, 2.947479248046875, 6.884483337402344, 10.82148551940918, 14.758487701416016, 18.69548988342285, 22.632492065429688, 26.569496154785156, 30.506498336791992, 34.44350051879883, 38.3805046081543, 42.3175048828125, 46.25450134277344, 50.191505432128906, 54.12850570678711, 58.06550979614258, 62.00251007080078, 65.93951416015625, 69.87651824951172, 73.81352233886719, 77.75051879882812, 81.6875228881836, 85.62452697753906, 89.5615234375, 93.49852752685547, 97.43553161621094, 101.3725357055664, 105.30953979492188, 109.24654388427734, 113.18354797363281, 117.12055206298828, 121.05755615234375, 124.99455261230469, 128.93154907226562, 132.86856079101562, 136.80555725097656, 140.74256896972656, 144.6795654296875, 148.6165771484375, 152.55357360839844, 156.49058532714844, 160.42758178710938, 164.36459350585938, 168.3015899658203, 172.23858642578125]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 8.0, 3.0, 6.0, 1.0, 12.0, 8.0, 15.0, 13.0, 11.0, 23.0, 15.0, 16.0, 20.0, 16.0, 33.0, 31.0, 28.0, 45.0, 41.0, 38.0, 46.0, 36.0, 48.0, 40.0, 36.0, 40.0, 36.0, 43.0, 39.0, 35.0, 30.0, 26.0, 25.0, 21.0, 21.0, 20.0, 12.0, 11.0, 14.0, 9.0, 9.0, 10.0, 4.0, 4.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-64.33148956298828, -62.33515167236328, -60.33881759643555, -58.34247970581055, -56.34614181518555, -54.34980773925781, -52.35346984863281, -50.35713195800781, -48.36079406738281, -46.36445617675781, -44.36812210083008, -42.37178421020508, -40.37544631958008, -38.379112243652344, -36.382774353027344, -34.386436462402344, -32.39010238647461, -30.393766403198242, -28.397428512573242, -26.401092529296875, -24.404754638671875, -22.408418655395508, -20.41208267211914, -18.41574478149414, -16.419408798217773, -14.42307186126709, -12.426734924316406, -10.430398941040039, -8.434062004089355, -6.437725067138672, -4.441389083862305, -2.445052146911621, -0.4487152099609375, 1.547621488571167, 3.5439581871032715, 5.540294647216797, 7.5366315841674805, 9.532968521118164, 11.529304504394531, 13.525641441345215, 15.521978378295898, 17.518314361572266, 19.514652252197266, 21.510988235473633, 23.50732421875, 25.503662109375, 27.499998092651367, 29.496334075927734, 31.492671966552734, 33.489009857177734, 35.48534393310547, 37.48168182373047, 39.47801971435547, 41.47435760498047, 43.4706916809082, 45.4670295715332, 47.46336364746094, 49.45970153808594, 51.45603561401367, 53.45237350463867, 55.44871139526367, 57.445045471191406, 59.441383361816406, 61.437721252441406, 63.434059143066406]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 13.0, 9.0, 6.0, 12.0, 22.0, 17.0, 24.0, 22.0, 34.0, 36.0, 43.0, 40.0, 46.0, 47.0, 67.0, 43.0, 38.0, 38.0, 43.0, 47.0, 49.0, 32.0, 46.0, 33.0, 28.0, 24.0, 18.0, 14.0, 23.0, 18.0, 12.0, 11.0, 8.0, 5.0, 4.0, 5.0, 3.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.50726318359375, -6.2606201171875, -6.01397705078125, -5.767333984375, -5.52069091796875, -5.2740478515625, -5.02740478515625, -4.78076171875, -4.53411865234375, -4.2874755859375, -4.04083251953125, -3.794189453125, -3.54754638671875, -3.3009033203125, -3.05426025390625, -2.8076171875, -2.56097412109375, -2.3143310546875, -2.06768798828125, -1.821044921875, -1.57440185546875, -1.3277587890625, -1.08111572265625, -0.83447265625, -0.58782958984375, -0.3411865234375, -0.09454345703125, 0.152099609375, 0.39874267578125, 0.6453857421875, 0.89202880859375, 1.138671875, 1.38531494140625, 1.6319580078125, 1.87860107421875, 2.125244140625, 2.37188720703125, 2.6185302734375, 2.86517333984375, 3.11181640625, 3.35845947265625, 3.6051025390625, 3.85174560546875, 4.098388671875, 4.34503173828125, 4.5916748046875, 4.83831787109375, 5.0849609375, 5.33160400390625, 5.5782470703125, 5.82489013671875, 6.071533203125, 6.31817626953125, 6.5648193359375, 6.81146240234375, 7.05810546875, 7.30474853515625, 7.5513916015625, 7.79803466796875, 8.044677734375, 8.29132080078125, 8.5379638671875, 8.78460693359375, 9.03125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 3.0, 10.0, 12.0, 10.0, 12.0, 29.0, 28.0, 38.0, 59.0, 71.0, 86.0, 141.0, 241.0, 430.0, 791.0, 1642.0, 4181.0, 13449.0, 54486.0, 276945.0, 1096710.0, 1739725.0, 783709.0, 172009.0, 34212.0, 9132.0, 3059.0, 1318.0, 673.0, 360.0, 219.0, 133.0, 94.0, 75.0, 54.0, 41.0, 24.0, 20.0, 13.0, 9.0, 7.0, 10.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.5802001953125, -8.277587890625, -7.9749755859375, -7.67236328125, -7.3697509765625, -7.067138671875, -6.7645263671875, -6.4619140625, -6.1593017578125, -5.856689453125, -5.5540771484375, -5.25146484375, -4.9488525390625, -4.646240234375, -4.3436279296875, -4.041015625, -3.7384033203125, -3.435791015625, -3.1331787109375, -2.83056640625, -2.5279541015625, -2.225341796875, -1.9227294921875, -1.6201171875, -1.3175048828125, -1.014892578125, -0.7122802734375, -0.40966796875, -0.1070556640625, 0.195556640625, 0.4981689453125, 0.80078125, 1.1033935546875, 1.406005859375, 1.7086181640625, 2.01123046875, 2.3138427734375, 2.616455078125, 2.9190673828125, 3.2216796875, 3.5242919921875, 3.826904296875, 4.1295166015625, 4.43212890625, 4.7347412109375, 5.037353515625, 5.3399658203125, 5.642578125, 5.9451904296875, 6.247802734375, 6.5504150390625, 6.85302734375, 7.1556396484375, 7.458251953125, 7.7608642578125, 8.0634765625, 8.3660888671875, 8.668701171875, 8.9713134765625, 9.27392578125, 9.5765380859375, 9.879150390625, 10.1817626953125, 10.484375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 11.0, 6.0, 16.0, 9.0, 16.0, 19.0, 29.0, 39.0, 51.0, 50.0, 77.0, 103.0, 136.0, 158.0, 216.0, 237.0, 306.0, 351.0, 364.0, 372.0, 302.0, 255.0, 207.0, 157.0, 134.0, 93.0, 75.0, 65.0, 48.0, 37.0, 22.0, 26.0, 21.0, 15.0, 14.0, 6.0, 2.0, 3.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.640625, -10.3017578125, -9.962890625, -9.6240234375, -9.28515625, -8.9462890625, -8.607421875, -8.2685546875, -7.9296875, -7.5908203125, -7.251953125, -6.9130859375, -6.57421875, -6.2353515625, -5.896484375, -5.5576171875, -5.21875, -4.8798828125, -4.541015625, -4.2021484375, -3.86328125, -3.5244140625, -3.185546875, -2.8466796875, -2.5078125, -2.1689453125, -1.830078125, -1.4912109375, -1.15234375, -0.8134765625, -0.474609375, -0.1357421875, 0.203125, 0.5419921875, 0.880859375, 1.2197265625, 1.55859375, 1.8974609375, 2.236328125, 2.5751953125, 2.9140625, 3.2529296875, 3.591796875, 3.9306640625, 4.26953125, 4.6083984375, 4.947265625, 5.2861328125, 5.625, 5.9638671875, 6.302734375, 6.6416015625, 6.98046875, 7.3193359375, 7.658203125, 7.9970703125, 8.3359375, 8.6748046875, 9.013671875, 9.3525390625, 9.69140625, 10.0302734375, 10.369140625, 10.7080078125, 11.046875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 5.0, 11.0, 7.0, 17.0, 25.0, 36.0, 41.0, 59.0, 69.0, 101.0, 106.0, 151.0, 196.0, 269.0, 412.0, 650.0, 1584.0, 8180.0, 284062.0, 3791264.0, 98890.0, 4994.0, 1185.0, 589.0, 349.0, 261.0, 203.0, 133.0, 102.0, 79.0, 55.0, 50.0, 31.0, 31.0, 19.0, 11.0, 13.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.28125, -40.9755859375, -39.669921875, -38.3642578125, -37.05859375, -35.7529296875, -34.447265625, -33.1416015625, -31.8359375, -30.5302734375, -29.224609375, -27.9189453125, -26.61328125, -25.3076171875, -24.001953125, -22.6962890625, -21.390625, -20.0849609375, -18.779296875, -17.4736328125, -16.16796875, -14.8623046875, -13.556640625, -12.2509765625, -10.9453125, -9.6396484375, -8.333984375, -7.0283203125, -5.72265625, -4.4169921875, -3.111328125, -1.8056640625, -0.5, 0.8056640625, 2.111328125, 3.4169921875, 4.72265625, 6.0283203125, 7.333984375, 8.6396484375, 9.9453125, 11.2509765625, 12.556640625, 13.8623046875, 15.16796875, 16.4736328125, 17.779296875, 19.0849609375, 20.390625, 21.6962890625, 23.001953125, 24.3076171875, 25.61328125, 26.9189453125, 28.224609375, 29.5302734375, 30.8359375, 32.1416015625, 33.447265625, 34.7529296875, 36.05859375, 37.3642578125, 38.669921875, 39.9755859375, 41.28125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 33.0, 653.0, 324.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-216.59719848632812, -202.88308715820312, -189.1689910888672, -175.4548797607422, -161.74078369140625, -148.02667236328125, -134.31256103515625, -120.59845733642578, -106.88435363769531, -93.17024993896484, -79.45614624023438, -65.74203491210938, -52.027931213378906, -38.31382751464844, -24.599716186523438, -10.885612487792969, 2.8284912109375, 16.5425968170166, 30.256702423095703, 43.97080993652344, 57.684913635253906, 71.39901733398438, 85.11312866210938, 98.82723236083984, 112.54133605957031, 126.25543975830078, 139.96954345703125, 153.68365478515625, 167.39776611328125, 181.1118621826172, 194.8259735107422, 208.54006958007812, 222.25421142578125, 235.96832275390625, 249.6824188232422, 263.39654541015625, 277.1106262207031, 290.8247375488281, 304.5388488769531, 318.2529602050781, 331.967041015625, 345.68115234375, 359.395263671875, 373.109375, 386.8234558105469, 400.5375671386719, 414.2516784667969, 427.9657897949219, 441.6799011230469, 455.3940124511719, 469.1081237792969, 482.82220458984375, 496.53631591796875, 510.25042724609375, 523.9645385742188, 537.6786499023438, 551.3927612304688, 565.1068725585938, 578.8209838867188, 592.5350952148438, 606.2492065429688, 619.9632568359375, 633.6773681640625, 647.3914794921875, 661.1055908203125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 8.0, 10.0, 8.0, 11.0, 20.0, 16.0, 13.0, 32.0, 31.0, 26.0, 38.0, 36.0, 43.0, 31.0, 31.0, 40.0, 48.0, 39.0, 47.0, 42.0, 37.0, 40.0, 40.0, 38.0, 37.0, 34.0, 28.0, 27.0, 33.0, 15.0, 18.0, 19.0, 11.0, 10.0, 8.0, 9.0, 4.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.46484375, -45.00541687011719, -43.545989990234375, -42.08656311035156, -40.627140045166016, -39.1677131652832, -37.70828628540039, -36.24885940551758, -34.78943634033203, -33.33000946044922, -31.87058448791504, -30.411157608032227, -28.951732635498047, -27.492305755615234, -26.032878875732422, -24.57345199584961, -23.114025115966797, -21.654598236083984, -20.195173263549805, -18.735746383666992, -17.276321411132812, -15.81689453125, -14.357467651367188, -12.898041725158691, -11.438615798950195, -9.9791898727417, -8.519763946533203, -7.060337066650391, -5.6009111404418945, -4.141485214233398, -2.682058334350586, -1.2226324081420898, 0.23679351806640625, 1.6962196826934814, 3.1556458473205566, 4.615072250366211, 6.074498176574707, 7.533924102783203, 8.993350982666016, 10.452776908874512, 11.912202835083008, 13.371628761291504, 14.8310546875, 16.290481567382812, 17.749908447265625, 19.209333419799805, 20.668760299682617, 22.128185272216797, 23.58761215209961, 25.047039031982422, 26.5064640045166, 27.965890884399414, 29.425315856933594, 30.884742736816406, 32.34416961669922, 33.80359649658203, 35.263023376464844, 36.722450256347656, 38.18187713623047, 39.64130401611328, 41.10072708129883, 42.56015396118164, 44.01958084106445, 45.479007720947266, 46.93843078613281]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 6.0, 6.0, 6.0, 4.0, 10.0, 7.0, 16.0, 16.0, 16.0, 26.0, 23.0, 22.0, 26.0, 36.0, 38.0, 42.0, 36.0, 38.0, 34.0, 50.0, 45.0, 40.0, 39.0, 56.0, 37.0, 41.0, 30.0, 35.0, 32.0, 27.0, 25.0, 25.0, 18.0, 13.0, 24.0, 15.0, 10.0, 10.0, 9.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.5003662109375, -5.274169921875, -5.0479736328125, -4.82177734375, -4.5955810546875, -4.369384765625, -4.1431884765625, -3.9169921875, -3.6907958984375, -3.464599609375, -3.2384033203125, -3.01220703125, -2.7860107421875, -2.559814453125, -2.3336181640625, -2.107421875, -1.8812255859375, -1.655029296875, -1.4288330078125, -1.20263671875, -0.9764404296875, -0.750244140625, -0.5240478515625, -0.2978515625, -0.0716552734375, 0.154541015625, 0.3807373046875, 0.60693359375, 0.8331298828125, 1.059326171875, 1.2855224609375, 1.51171875, 1.7379150390625, 1.964111328125, 2.1903076171875, 2.41650390625, 2.6427001953125, 2.868896484375, 3.0950927734375, 3.3212890625, 3.5474853515625, 3.773681640625, 3.9998779296875, 4.22607421875, 4.4522705078125, 4.678466796875, 4.9046630859375, 5.130859375, 5.3570556640625, 5.583251953125, 5.8094482421875, 6.03564453125, 6.2618408203125, 6.488037109375, 6.7142333984375, 6.9404296875, 7.1666259765625, 7.392822265625, 7.6190185546875, 7.84521484375, 8.0714111328125, 8.297607421875, 8.5238037109375, 8.75]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 12.0, 23.0, 22.0, 26.0, 58.0, 85.0, 129.0, 206.0, 325.0, 449.0, 706.0, 1072.0, 1676.0, 2563.0, 4139.0, 6613.0, 10863.0, 17681.0, 30513.0, 53833.0, 95654.0, 159567.0, 214839.0, 180435.0, 112505.0, 63993.0, 36039.0, 21010.0, 12751.0, 7570.0, 4723.0, 2979.0, 1973.0, 1262.0, 746.0, 494.0, 345.0, 245.0, 148.0, 89.0, 53.0, 48.0, 29.0, 25.0, 11.0, 13.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.73486328125, -0.7123565673828125, -0.689849853515625, -0.6673431396484375, -0.64483642578125, -0.6223297119140625, -0.599822998046875, -0.5773162841796875, -0.5548095703125, -0.5323028564453125, -0.509796142578125, -0.4872894287109375, -0.46478271484375, -0.4422760009765625, -0.419769287109375, -0.3972625732421875, -0.374755859375, -0.3522491455078125, -0.329742431640625, -0.3072357177734375, -0.28472900390625, -0.2622222900390625, -0.239715576171875, -0.2172088623046875, -0.1947021484375, -0.1721954345703125, -0.149688720703125, -0.1271820068359375, -0.10467529296875, -0.0821685791015625, -0.059661865234375, -0.0371551513671875, -0.0146484375, 0.0078582763671875, 0.030364990234375, 0.0528717041015625, 0.07537841796875, 0.0978851318359375, 0.120391845703125, 0.1428985595703125, 0.1654052734375, 0.1879119873046875, 0.210418701171875, 0.2329254150390625, 0.25543212890625, 0.2779388427734375, 0.300445556640625, 0.3229522705078125, 0.345458984375, 0.3679656982421875, 0.390472412109375, 0.4129791259765625, 0.43548583984375, 0.4579925537109375, 0.480499267578125, 0.5030059814453125, 0.5255126953125, 0.5480194091796875, 0.570526123046875, 0.5930328369140625, 0.61553955078125, 0.6380462646484375, 0.660552978515625, 0.6830596923828125, 0.70556640625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 4.0, 3.0, 8.0, 6.0, 8.0, 7.0, 15.0, 13.0, 22.0, 25.0, 22.0, 19.0, 24.0, 24.0, 37.0, 23.0, 29.0, 27.0, 31.0, 40.0, 46.0, 47.0, 1057.0, 43.0, 30.0, 49.0, 36.0, 29.0, 33.0, 22.0, 26.0, 16.0, 16.0, 25.0, 27.0, 22.0, 14.0, 14.0, 14.0, 13.0, 14.0, 12.0, 8.0, 12.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.673828125, -3.548919677734375, -3.42401123046875, -3.299102783203125, -3.1741943359375, -3.049285888671875, -2.92437744140625, -2.799468994140625, -2.674560546875, -2.549652099609375, -2.42474365234375, -2.299835205078125, -2.1749267578125, -2.050018310546875, -1.92510986328125, -1.800201416015625, -1.67529296875, -1.550384521484375, -1.42547607421875, -1.300567626953125, -1.1756591796875, -1.050750732421875, -0.92584228515625, -0.800933837890625, -0.676025390625, -0.551116943359375, -0.42620849609375, -0.301300048828125, -0.1763916015625, -0.051483154296875, 0.07342529296875, 0.198333740234375, 0.3232421875, 0.448150634765625, 0.57305908203125, 0.697967529296875, 0.8228759765625, 0.947784423828125, 1.07269287109375, 1.197601318359375, 1.322509765625, 1.447418212890625, 1.57232666015625, 1.697235107421875, 1.8221435546875, 1.947052001953125, 2.07196044921875, 2.196868896484375, 2.32177734375, 2.446685791015625, 2.57159423828125, 2.696502685546875, 2.8214111328125, 2.946319580078125, 3.07122802734375, 3.196136474609375, 3.321044921875, 3.445953369140625, 3.57086181640625, 3.695770263671875, 3.8206787109375, 3.945587158203125, 4.07049560546875, 4.195404052734375, 4.3203125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 13.0, 8.0, 13.0, 20.0, 30.0, 53.0, 67.0, 105.0, 151.0, 246.0, 387.0, 580.0, 926.0, 1494.0, 2436.0, 3777.0, 6408.0, 10459.0, 17803.0, 29360.0, 49761.0, 83978.0, 133937.0, 705676.0, 707085.0, 133901.0, 84462.0, 49728.0, 29329.0, 17530.0, 10634.0, 6394.0, 3798.0, 2377.0, 1533.0, 960.0, 658.0, 352.0, 224.0, 160.0, 98.0, 82.0, 46.0, 35.0, 15.0, 19.0, 10.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5478515625, -0.530731201171875, -0.51361083984375, -0.496490478515625, -0.4793701171875, -0.462249755859375, -0.44512939453125, -0.428009033203125, -0.410888671875, -0.393768310546875, -0.37664794921875, -0.359527587890625, -0.3424072265625, -0.325286865234375, -0.30816650390625, -0.291046142578125, -0.27392578125, -0.256805419921875, -0.23968505859375, -0.222564697265625, -0.2054443359375, -0.188323974609375, -0.17120361328125, -0.154083251953125, -0.136962890625, -0.119842529296875, -0.10272216796875, -0.085601806640625, -0.0684814453125, -0.051361083984375, -0.03424072265625, -0.017120361328125, 0.0, 0.017120361328125, 0.03424072265625, 0.051361083984375, 0.0684814453125, 0.085601806640625, 0.10272216796875, 0.119842529296875, 0.136962890625, 0.154083251953125, 0.17120361328125, 0.188323974609375, 0.2054443359375, 0.222564697265625, 0.23968505859375, 0.256805419921875, 0.27392578125, 0.291046142578125, 0.30816650390625, 0.325286865234375, 0.3424072265625, 0.359527587890625, 0.37664794921875, 0.393768310546875, 0.410888671875, 0.428009033203125, 0.44512939453125, 0.462249755859375, 0.4793701171875, 0.496490478515625, 0.51361083984375, 0.530731201171875, 0.5478515625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 5.0, 6.0, 14.0, 13.0, 15.0, 28.0, 19.0, 28.0, 33.0, 27.0, 37.0, 41.0, 42.0, 59.0, 49.0, 72.0, 51.0, 48.0, 56.0, 55.0, 47.0, 40.0, 35.0, 23.0, 29.0, 19.0, 21.0, 18.0, 19.0, 9.0, 7.0, 6.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0020427703857421875, -0.0019805431365966797, -0.0019183158874511719, -0.001856088638305664, -0.0017938613891601562, -0.0017316341400146484, -0.0016694068908691406, -0.0016071796417236328, -0.001544952392578125, -0.0014827251434326172, -0.0014204978942871094, -0.0013582706451416016, -0.0012960433959960938, -0.001233816146850586, -0.0011715888977050781, -0.0011093616485595703, -0.0010471343994140625, -0.0009849071502685547, -0.0009226799011230469, -0.0008604526519775391, -0.0007982254028320312, -0.0007359981536865234, -0.0006737709045410156, -0.0006115436553955078, -0.00054931640625, -0.0004870891571044922, -0.0004248619079589844, -0.00036263465881347656, -0.00030040740966796875, -0.00023818016052246094, -0.00017595291137695312, -0.00011372566223144531, -5.14984130859375e-05, 1.0728836059570312e-05, 7.295608520507812e-05, 0.00013518333435058594, 0.00019741058349609375, 0.00025963783264160156, 0.0003218650817871094, 0.0003840923309326172, 0.000446319580078125, 0.0005085468292236328, 0.0005707740783691406, 0.0006330013275146484, 0.0006952285766601562, 0.0007574558258056641, 0.0008196830749511719, 0.0008819103240966797, 0.0009441375732421875, 0.0010063648223876953, 0.0010685920715332031, 0.001130819320678711, 0.0011930465698242188, 0.0012552738189697266, 0.0013175010681152344, 0.0013797283172607422, 0.00144195556640625, 0.0015041828155517578, 0.0015664100646972656, 0.0016286373138427734, 0.0016908645629882812, 0.001753091812133789, 0.0018153190612792969, 0.0018775463104248047, 0.0019397735595703125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 6.0, 9.0, 8.0, 13.0, 18.0, 23.0, 22.0, 36.0, 43.0, 45.0, 70.0, 96.0, 108.0, 145.0, 297.0, 700.0, 8399.0, 1027585.0, 9316.0, 677.0, 299.0, 157.0, 104.0, 71.0, 66.0, 39.0, 44.0, 34.0, 25.0, 19.0, 19.0, 10.0, 14.0, 6.0, 7.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.041107177734375, -0.03980255126953125, -0.0384979248046875, -0.03719329833984375, -0.035888671875, -0.03458404541015625, -0.0332794189453125, -0.03197479248046875, -0.030670166015625, -0.02936553955078125, -0.0280609130859375, -0.02675628662109375, -0.02545166015625, -0.02414703369140625, -0.0228424072265625, -0.02153778076171875, -0.020233154296875, -0.01892852783203125, -0.0176239013671875, -0.01631927490234375, -0.0150146484375, -0.01371002197265625, -0.0124053955078125, -0.01110076904296875, -0.009796142578125, -0.00849151611328125, -0.0071868896484375, -0.00588226318359375, -0.00457763671875, -0.00327301025390625, -0.0019683837890625, -0.00066375732421875, 0.000640869140625, 0.00194549560546875, 0.0032501220703125, 0.00455474853515625, 0.005859375, 0.00716400146484375, 0.0084686279296875, 0.00977325439453125, 0.011077880859375, 0.01238250732421875, 0.0136871337890625, 0.01499176025390625, 0.01629638671875, 0.01760101318359375, 0.0189056396484375, 0.02021026611328125, 0.021514892578125, 0.02281951904296875, 0.0241241455078125, 0.02542877197265625, 0.0267333984375, 0.02803802490234375, 0.0293426513671875, 0.03064727783203125, 0.031951904296875, 0.03325653076171875, 0.0345611572265625, 0.03586578369140625, 0.03717041015625, 0.03847503662109375, 0.0397796630859375, 0.04108428955078125, 0.042388916015625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 81.0, 933.0, 3.0], "bins": [-0.04052910581231117, -0.039878811687231064, -0.039228521287441254, -0.038578227162361145, -0.037927933037281036, -0.03727763891220093, -0.03662734851241112, -0.03597705438733101, -0.0353267602622509, -0.03467646613717079, -0.03402617573738098, -0.03337588161230087, -0.032725587487220764, -0.032075293362140656, -0.031425002962350845, -0.030774708837270737, -0.030124416574835777, -0.029474124312400818, -0.02882383018732071, -0.02817353792488575, -0.02752324379980564, -0.026872951537370682, -0.026222657412290573, -0.025572365149855614, -0.024922072887420654, -0.024271780624985695, -0.023621486499905586, -0.022971194237470627, -0.022320900112390518, -0.02167060784995556, -0.02102031372487545, -0.02037002146244049, -0.019719725474715233, -0.019069433212280273, -0.018419139087200165, -0.017768846824765205, -0.017118552699685097, -0.016468260437250137, -0.01581796631217003, -0.01516767404973507, -0.01451738178730011, -0.013867088593542576, -0.013216795399785042, -0.012566502206027508, -0.011916209012269974, -0.011265916749835014, -0.01061562355607748, -0.009965330362319946, -0.009315037168562412, -0.008664743974804878, -0.008014450781047344, -0.0073641580529510975, -0.0067138648591935635, -0.0060635716654360294, -0.005413278937339783, -0.004762985743582249, -0.004112692084163427, -0.0034623988904058933, -0.002812105929479003, -0.0021618129685521126, -0.0015115197747945786, -0.0008612265810370445, -0.00021093362011015415, 0.0004393593408167362, 0.0010896524181589484]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 8.0, 7.0, 11.0, 13.0, 21.0, 17.0, 22.0, 30.0, 35.0, 39.0, 38.0, 44.0, 47.0, 50.0, 57.0, 50.0, 64.0, 57.0, 45.0, 60.0, 49.0, 38.0, 28.0, 38.0, 33.0, 22.0, 18.0, 12.0, 14.0, 7.0, 9.0, 8.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010290741920471191, -0.0009841816499829292, -0.0009392891079187393, -0.0008943965658545494, -0.0008495040237903595, -0.0008046114817261696, -0.0007597189396619797, -0.0007148263975977898, -0.0006699338555335999, -0.0006250413134694099, -0.00058014877140522, -0.0005352562293410301, -0.0004903636872768402, -0.0004454711452126503, -0.0004005786031484604, -0.0003556860610842705, -0.00031079351902008057, -0.00026590097695589066, -0.00022100843489170074, -0.00017611589282751083, -0.00013122335076332092, -8.633080869913101e-05, -4.14382666349411e-05, 3.45427542924881e-06, 4.834681749343872e-05, 9.323935955762863e-05, 0.00013813190162181854, 0.00018302444368600845, 0.00022791698575019836, 0.0002728095278143883, 0.0003177020698785782, 0.0003625946119427681, 0.000407487154006958, 0.0004523796960711479, 0.0004972722381353378, 0.0005421647801995277, 0.0005870573222637177, 0.0006319498643279076, 0.0006768424063920975, 0.0007217349484562874, 0.0007666274905204773, 0.0008115200325846672, 0.0008564125746488571, 0.000901305116713047, 0.0009461976587772369, 0.0009910902008414268, 0.0010359827429056168, 0.0010808752849698067, 0.0011257678270339966, 0.0011706603690981865, 0.0012155529111623764, 0.0012604454532265663, 0.0013053379952907562, 0.0013502305373549461, 0.001395123079419136, 0.001440015621483326, 0.0014849081635475159, 0.0015298007056117058, 0.0015746932476758957, 0.0016195857897400856, 0.0016644783318042755, 0.0017093708738684654, 0.0017542634159326553, 0.0017991559579968452, 0.0018440485000610352]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 6.0, 6.0, 6.0, 4.0, 10.0, 7.0, 16.0, 16.0, 16.0, 26.0, 23.0, 22.0, 26.0, 36.0, 38.0, 42.0, 36.0, 38.0, 34.0, 50.0, 45.0, 40.0, 39.0, 56.0, 37.0, 41.0, 30.0, 35.0, 32.0, 27.0, 25.0, 25.0, 18.0, 13.0, 24.0, 15.0, 10.0, 10.0, 9.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.5003662109375, -5.274169921875, -5.0479736328125, -4.82177734375, -4.5955810546875, -4.369384765625, -4.1431884765625, -3.9169921875, -3.6907958984375, -3.464599609375, -3.2384033203125, -3.01220703125, -2.7860107421875, -2.559814453125, -2.3336181640625, -2.107421875, -1.8812255859375, -1.655029296875, -1.4288330078125, -1.20263671875, -0.9764404296875, -0.750244140625, -0.5240478515625, -0.2978515625, -0.0716552734375, 0.154541015625, 0.3807373046875, 0.60693359375, 0.8331298828125, 1.059326171875, 1.2855224609375, 1.51171875, 1.7379150390625, 1.964111328125, 2.1903076171875, 2.41650390625, 2.6427001953125, 2.868896484375, 3.0950927734375, 3.3212890625, 3.5474853515625, 3.773681640625, 3.9998779296875, 4.22607421875, 4.4522705078125, 4.678466796875, 4.9046630859375, 5.130859375, 5.3570556640625, 5.583251953125, 5.8094482421875, 6.03564453125, 6.2618408203125, 6.488037109375, 6.7142333984375, 6.9404296875, 7.1666259765625, 7.392822265625, 7.6190185546875, 7.84521484375, 8.0714111328125, 8.297607421875, 8.5238037109375, 8.75]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 8.0, 7.0, 10.0, 17.0, 23.0, 33.0, 42.0, 71.0, 104.0, 187.0, 385.0, 792.0, 1730.0, 3687.0, 8240.0, 19321.0, 48010.0, 126838.0, 359294.0, 306131.0, 103758.0, 40123.0, 16592.0, 7082.0, 3063.0, 1468.0, 695.0, 356.0, 163.0, 105.0, 55.0, 35.0, 33.0, 25.0, 20.0, 16.0, 4.0, 9.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.30645751953125, -5.0933837890625, -4.88031005859375, -4.667236328125, -4.45416259765625, -4.2410888671875, -4.02801513671875, -3.81494140625, -3.60186767578125, -3.3887939453125, -3.17572021484375, -2.962646484375, -2.74957275390625, -2.5364990234375, -2.32342529296875, -2.1103515625, -1.89727783203125, -1.6842041015625, -1.47113037109375, -1.258056640625, -1.04498291015625, -0.8319091796875, -0.61883544921875, -0.40576171875, -0.19268798828125, 0.0203857421875, 0.23345947265625, 0.446533203125, 0.65960693359375, 0.8726806640625, 1.08575439453125, 1.298828125, 1.51190185546875, 1.7249755859375, 1.93804931640625, 2.151123046875, 2.36419677734375, 2.5772705078125, 2.79034423828125, 3.00341796875, 3.21649169921875, 3.4295654296875, 3.64263916015625, 3.855712890625, 4.06878662109375, 4.2818603515625, 4.49493408203125, 4.7080078125, 4.92108154296875, 5.1341552734375, 5.34722900390625, 5.560302734375, 5.77337646484375, 5.9864501953125, 6.19952392578125, 6.41259765625, 6.62567138671875, 6.8387451171875, 7.05181884765625, 7.264892578125, 7.47796630859375, 7.6910400390625, 7.90411376953125, 8.1171875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 13.0, 9.0, 11.0, 17.0, 15.0, 16.0, 18.0, 15.0, 30.0, 32.0, 28.0, 42.0, 29.0, 41.0, 58.0, 55.0, 95.0, 354.0, 1555.0, 146.0, 75.0, 48.0, 42.0, 35.0, 32.0, 27.0, 25.0, 29.0, 19.0, 21.0, 26.0, 15.0, 13.0, 8.0, 9.0, 11.0, 8.0, 4.0, 3.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.6875, -20.945068359375, -20.20263671875, -19.460205078125, -18.7177734375, -17.975341796875, -17.23291015625, -16.490478515625, -15.748046875, -15.005615234375, -14.26318359375, -13.520751953125, -12.7783203125, -12.035888671875, -11.29345703125, -10.551025390625, -9.80859375, -9.066162109375, -8.32373046875, -7.581298828125, -6.8388671875, -6.096435546875, -5.35400390625, -4.611572265625, -3.869140625, -3.126708984375, -2.38427734375, -1.641845703125, -0.8994140625, -0.156982421875, 0.58544921875, 1.327880859375, 2.0703125, 2.812744140625, 3.55517578125, 4.297607421875, 5.0400390625, 5.782470703125, 6.52490234375, 7.267333984375, 8.009765625, 8.752197265625, 9.49462890625, 10.237060546875, 10.9794921875, 11.721923828125, 12.46435546875, 13.206787109375, 13.94921875, 14.691650390625, 15.43408203125, 16.176513671875, 16.9189453125, 17.661376953125, 18.40380859375, 19.146240234375, 19.888671875, 20.631103515625, 21.37353515625, 22.115966796875, 22.8583984375, 23.600830078125, 24.34326171875, 25.085693359375, 25.828125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 12.0, 11.0, 13.0, 11.0, 17.0, 11.0, 25.0, 40.0, 58.0, 36.0, 70.0, 89.0, 98.0, 139.0, 206.0, 317.0, 572.0, 2041.0, 55736.0, 3009269.0, 72689.0, 2437.0, 594.0, 342.0, 204.0, 133.0, 99.0, 99.0, 75.0, 53.0, 44.0, 24.0, 29.0, 24.0, 16.0, 12.0, 14.0, 11.0, 7.0, 5.0, 4.0, 4.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-42.78125, -41.5771484375, -40.373046875, -39.1689453125, -37.96484375, -36.7607421875, -35.556640625, -34.3525390625, -33.1484375, -31.9443359375, -30.740234375, -29.5361328125, -28.33203125, -27.1279296875, -25.923828125, -24.7197265625, -23.515625, -22.3115234375, -21.107421875, -19.9033203125, -18.69921875, -17.4951171875, -16.291015625, -15.0869140625, -13.8828125, -12.6787109375, -11.474609375, -10.2705078125, -9.06640625, -7.8623046875, -6.658203125, -5.4541015625, -4.25, -3.0458984375, -1.841796875, -0.6376953125, 0.56640625, 1.7705078125, 2.974609375, 4.1787109375, 5.3828125, 6.5869140625, 7.791015625, 8.9951171875, 10.19921875, 11.4033203125, 12.607421875, 13.8115234375, 15.015625, 16.2197265625, 17.423828125, 18.6279296875, 19.83203125, 21.0361328125, 22.240234375, 23.4443359375, 24.6484375, 25.8525390625, 27.056640625, 28.2607421875, 29.46484375, 30.6689453125, 31.873046875, 33.0771484375, 34.28125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 26.0, 101.0, 260.0, 353.0, 207.0, 49.0, 13.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.6065902709961, -62.23388671875, -59.861183166503906, -57.48847579956055, -55.11577224731445, -52.74306869506836, -50.370361328125, -47.997657775878906, -45.62495422363281, -43.25225067138672, -40.879547119140625, -38.506839752197266, -36.13413619995117, -33.76143264770508, -31.38872718811035, -29.016021728515625, -26.64331817626953, -24.270614624023438, -21.89790916442871, -19.525203704833984, -17.15250015258789, -14.77979564666748, -12.40709114074707, -10.034385681152344, -7.66168212890625, -5.28897762298584, -2.9162731170654297, -0.5435686111450195, 1.8291358947753906, 4.201840400695801, 6.574544906616211, 8.947250366210938, 11.319953918457031, 13.692658424377441, 16.06536293029785, 18.438068389892578, 20.810771942138672, 23.183475494384766, 25.556180953979492, 27.92888641357422, 30.301589965820312, 32.674293518066406, 35.0469970703125, 37.41970443725586, 39.79240798950195, 42.16511154174805, 44.537818908691406, 46.9105224609375, 49.283226013183594, 51.65592956542969, 54.02863311767578, 56.40134048461914, 58.774044036865234, 61.14674758911133, 63.51945495605469, 65.89215850830078, 68.26486206054688, 70.63756561279297, 73.01026916503906, 75.38297271728516, 77.75567626953125, 80.12838745117188, 82.50109100341797, 84.87379455566406, 87.24649810791016]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 9.0, 3.0, 7.0, 8.0, 12.0, 13.0, 12.0, 14.0, 16.0, 22.0, 34.0, 28.0, 33.0, 25.0, 29.0, 31.0, 36.0, 42.0, 32.0, 42.0, 50.0, 49.0, 54.0, 38.0, 34.0, 38.0, 33.0, 29.0, 23.0, 29.0, 27.0, 23.0, 13.0, 12.0, 21.0, 15.0, 15.0, 9.0, 8.0, 5.0, 10.0, 4.0, 6.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.220550537109375, -52.39317321777344, -50.5657958984375, -48.73841857910156, -46.911041259765625, -45.08366394042969, -43.25628662109375, -41.42890930175781, -39.601531982421875, -37.77415466308594, -35.94677734375, -34.11940002441406, -32.292022705078125, -30.464645385742188, -28.63726806640625, -26.809890747070312, -24.982513427734375, -23.155136108398438, -21.3277587890625, -19.500381469726562, -17.673004150390625, -15.845626831054688, -14.01824951171875, -12.190872192382812, -10.363494873046875, -8.536117553710938, -6.708740234375, -4.8813629150390625, -3.053985595703125, -1.2266082763671875, 0.60076904296875, 2.4281463623046875, 4.255523681640625, 6.0829010009765625, 7.9102783203125, 9.737655639648438, 11.565032958984375, 13.392410278320312, 15.21978759765625, 17.047164916992188, 18.874542236328125, 20.701919555664062, 22.529296875, 24.356674194335938, 26.184051513671875, 28.011428833007812, 29.83880615234375, 31.666183471679688, 33.493560791015625, 35.32093811035156, 37.1483154296875, 38.97569274902344, 40.803070068359375, 42.63044738769531, 44.45782470703125, 46.28520202636719, 48.112579345703125, 49.93995666503906, 51.767333984375, 53.59471130371094, 55.422088623046875, 57.24946594238281, 59.07684326171875, 60.90422058105469, 62.731597900390625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 0.0, 5.0, 7.0, 10.0, 13.0, 10.0, 19.0, 17.0, 13.0, 21.0, 21.0, 28.0, 29.0, 24.0, 35.0, 35.0, 37.0, 44.0, 41.0, 34.0, 45.0, 41.0, 44.0, 29.0, 45.0, 40.0, 32.0, 41.0, 27.0, 31.0, 22.0, 21.0, 19.0, 17.0, 16.0, 13.0, 14.0, 15.0, 13.0, 8.0, 6.0, 6.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.18359375, -5.96685791015625, -5.7501220703125, -5.53338623046875, -5.316650390625, -5.09991455078125, -4.8831787109375, -4.66644287109375, -4.44970703125, -4.23297119140625, -4.0162353515625, -3.79949951171875, -3.582763671875, -3.36602783203125, -3.1492919921875, -2.93255615234375, -2.7158203125, -2.49908447265625, -2.2823486328125, -2.06561279296875, -1.848876953125, -1.63214111328125, -1.4154052734375, -1.19866943359375, -0.98193359375, -0.76519775390625, -0.5484619140625, -0.33172607421875, -0.114990234375, 0.10174560546875, 0.3184814453125, 0.53521728515625, 0.751953125, 0.96868896484375, 1.1854248046875, 1.40216064453125, 1.618896484375, 1.83563232421875, 2.0523681640625, 2.26910400390625, 2.48583984375, 2.70257568359375, 2.9193115234375, 3.13604736328125, 3.352783203125, 3.56951904296875, 3.7862548828125, 4.00299072265625, 4.2197265625, 4.43646240234375, 4.6531982421875, 4.86993408203125, 5.086669921875, 5.30340576171875, 5.5201416015625, 5.73687744140625, 5.95361328125, 6.17034912109375, 6.3870849609375, 6.60382080078125, 6.820556640625, 7.03729248046875, 7.2540283203125, 7.47076416015625, 7.6875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 12.0, 7.0, 7.0, 14.0, 14.0, 20.0, 28.0, 24.0, 37.0, 48.0, 60.0, 74.0, 113.0, 205.0, 529.0, 2011.0, 13904.0, 263128.0, 3124957.0, 754130.0, 30108.0, 3364.0, 747.0, 236.0, 113.0, 68.0, 62.0, 52.0, 33.0, 35.0, 27.0, 13.0, 21.0, 14.0, 12.0, 9.0, 8.0, 13.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.640625, -17.966552734375, -17.29248046875, -16.618408203125, -15.9443359375, -15.270263671875, -14.59619140625, -13.922119140625, -13.248046875, -12.573974609375, -11.89990234375, -11.225830078125, -10.5517578125, -9.877685546875, -9.20361328125, -8.529541015625, -7.85546875, -7.181396484375, -6.50732421875, -5.833251953125, -5.1591796875, -4.485107421875, -3.81103515625, -3.136962890625, -2.462890625, -1.788818359375, -1.11474609375, -0.440673828125, 0.2333984375, 0.907470703125, 1.58154296875, 2.255615234375, 2.9296875, 3.603759765625, 4.27783203125, 4.951904296875, 5.6259765625, 6.300048828125, 6.97412109375, 7.648193359375, 8.322265625, 8.996337890625, 9.67041015625, 10.344482421875, 11.0185546875, 11.692626953125, 12.36669921875, 13.040771484375, 13.71484375, 14.388916015625, 15.06298828125, 15.737060546875, 16.4111328125, 17.085205078125, 17.75927734375, 18.433349609375, 19.107421875, 19.781494140625, 20.45556640625, 21.129638671875, 21.8037109375, 22.477783203125, 23.15185546875, 23.825927734375, 24.5]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 4.0, 7.0, 4.0, 14.0, 14.0, 13.0, 20.0, 45.0, 63.0, 69.0, 121.0, 152.0, 210.0, 302.0, 444.0, 513.0, 508.0, 434.0, 348.0, 229.0, 175.0, 128.0, 90.0, 55.0, 32.0, 21.0, 17.0, 8.0, 9.0, 8.0, 8.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.9046630859375, -16.449951171875, -15.9952392578125, -15.54052734375, -15.0858154296875, -14.631103515625, -14.1763916015625, -13.7216796875, -13.2669677734375, -12.812255859375, -12.3575439453125, -11.90283203125, -11.4481201171875, -10.993408203125, -10.5386962890625, -10.083984375, -9.6292724609375, -9.174560546875, -8.7198486328125, -8.26513671875, -7.8104248046875, -7.355712890625, -6.9010009765625, -6.4462890625, -5.9915771484375, -5.536865234375, -5.0821533203125, -4.62744140625, -4.1727294921875, -3.718017578125, -3.2633056640625, -2.80859375, -2.3538818359375, -1.899169921875, -1.4444580078125, -0.98974609375, -0.5350341796875, -0.080322265625, 0.3743896484375, 0.8291015625, 1.2838134765625, 1.738525390625, 2.1932373046875, 2.64794921875, 3.1026611328125, 3.557373046875, 4.0120849609375, 4.466796875, 4.9215087890625, 5.376220703125, 5.8309326171875, 6.28564453125, 6.7403564453125, 7.195068359375, 7.6497802734375, 8.1044921875, 8.5592041015625, 9.013916015625, 9.4686279296875, 9.92333984375, 10.3780517578125, 10.832763671875, 11.2874755859375, 11.7421875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 9.0, 10.0, 15.0, 14.0, 24.0, 34.0, 43.0, 70.0, 103.0, 108.0, 163.0, 236.0, 390.0, 1060.0, 7882.0, 501194.0, 3648209.0, 30850.0, 2257.0, 564.0, 284.0, 213.0, 152.0, 106.0, 80.0, 50.0, 46.0, 32.0, 27.0, 16.0, 9.0, 9.0, 11.0, 7.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.84375, -49.103515625, -47.36328125, -45.623046875, -43.8828125, -42.142578125, -40.40234375, -38.662109375, -36.921875, -35.181640625, -33.44140625, -31.701171875, -29.9609375, -28.220703125, -26.48046875, -24.740234375, -23.0, -21.259765625, -19.51953125, -17.779296875, -16.0390625, -14.298828125, -12.55859375, -10.818359375, -9.078125, -7.337890625, -5.59765625, -3.857421875, -2.1171875, -0.376953125, 1.36328125, 3.103515625, 4.84375, 6.583984375, 8.32421875, 10.064453125, 11.8046875, 13.544921875, 15.28515625, 17.025390625, 18.765625, 20.505859375, 22.24609375, 23.986328125, 25.7265625, 27.466796875, 29.20703125, 30.947265625, 32.6875, 34.427734375, 36.16796875, 37.908203125, 39.6484375, 41.388671875, 43.12890625, 44.869140625, 46.609375, 48.349609375, 50.08984375, 51.830078125, 53.5703125, 55.310546875, 57.05078125, 58.791015625, 60.53125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 10.0, 35.0, 103.0, 265.0, 325.0, 182.0, 58.0, 30.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.02708053588867, -42.880699157714844, -38.73431396484375, -34.58793258666992, -30.44154930114746, -26.295166015625, -22.148784637451172, -18.00240135192871, -13.85601806640625, -9.709634780883789, -5.5632524490356445, -1.4168701171875, 2.729513168334961, 6.875896453857422, 11.02227783203125, 15.168661117553711, 19.315044403076172, 23.461427688598633, 27.607810974121094, 31.754192352294922, 35.90057373046875, 40.046958923339844, 44.19334030151367, 48.3397216796875, 52.486106872558594, 56.63248825073242, 60.778873443603516, 64.92525482177734, 69.07164001464844, 73.218017578125, 77.3644027709961, 81.51078796386719, 85.65716552734375, 89.80355072021484, 93.9499282836914, 98.0963134765625, 102.2426986694336, 106.38908386230469, 110.53546142578125, 114.68184661865234, 118.82823181152344, 122.97461700439453, 127.1209945678711, 131.2673797607422, 135.41375732421875, 139.56015014648438, 143.70652770996094, 147.8529052734375, 151.99929809570312, 156.1456756591797, 160.2920684814453, 164.43844604492188, 168.58482360839844, 172.73121643066406, 176.87759399414062, 181.0239715576172, 185.17034912109375, 189.3167266845703, 193.46311950683594, 197.6094970703125, 201.75587463378906, 205.9022674560547, 210.04864501953125, 214.1950225830078, 218.34141540527344]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 7.0, 6.0, 9.0, 8.0, 13.0, 16.0, 19.0, 13.0, 26.0, 22.0, 15.0, 36.0, 32.0, 31.0, 42.0, 41.0, 42.0, 44.0, 51.0, 44.0, 47.0, 42.0, 42.0, 39.0, 31.0, 37.0, 29.0, 31.0, 31.0, 29.0, 19.0, 14.0, 28.0, 9.0, 12.0, 11.0, 10.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0], "bins": [-52.600250244140625, -51.14336013793945, -49.68647003173828, -48.229583740234375, -46.7726936340332, -45.31580352783203, -43.85891342163086, -42.40202331542969, -40.94513702392578, -39.48824691772461, -38.03135681152344, -36.57447052001953, -35.11758041381836, -33.66069030761719, -32.203800201416016, -30.746910095214844, -29.290019989013672, -27.8331298828125, -26.37624168395996, -24.91935157775879, -23.46246337890625, -22.005573272705078, -20.548683166503906, -19.091793060302734, -17.634904861450195, -16.178014755249023, -14.721126556396484, -13.264236450195312, -11.807347297668457, -10.350458145141602, -8.89356803894043, -7.436678886413574, -5.979789733886719, -4.522900581359863, -3.0660109519958496, -1.609121322631836, -0.15223217010498047, 1.304656982421875, 2.761547088623047, 4.218436241149902, 5.675325393676758, 7.132214546203613, 8.589103698730469, 10.04599380493164, 11.502882957458496, 12.959772109985352, 14.416662216186523, 15.873551368713379, 17.330440521240234, 18.787330627441406, 20.244218826293945, 21.701108932495117, 23.157997131347656, 24.614887237548828, 26.07177734375, 27.528667449951172, 28.98555564880371, 30.442445755004883, 31.899333953857422, 33.356224060058594, 34.813114166259766, 36.27000427246094, 37.726890563964844, 39.183780670166016, 40.64067077636719]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 7.0, 7.0, 14.0, 6.0, 19.0, 19.0, 22.0, 30.0, 23.0, 28.0, 35.0, 34.0, 28.0, 43.0, 44.0, 45.0, 50.0, 34.0, 39.0, 51.0, 45.0, 42.0, 36.0, 38.0, 25.0, 36.0, 22.0, 17.0, 27.0, 17.0, 20.0, 13.0, 16.0, 12.0, 10.0, 9.0, 7.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.67919921875, -5.4521484375, -5.22509765625, -4.998046875, -4.77099609375, -4.5439453125, -4.31689453125, -4.08984375, -3.86279296875, -3.6357421875, -3.40869140625, -3.181640625, -2.95458984375, -2.7275390625, -2.50048828125, -2.2734375, -2.04638671875, -1.8193359375, -1.59228515625, -1.365234375, -1.13818359375, -0.9111328125, -0.68408203125, -0.45703125, -0.22998046875, -0.0029296875, 0.22412109375, 0.451171875, 0.67822265625, 0.9052734375, 1.13232421875, 1.359375, 1.58642578125, 1.8134765625, 2.04052734375, 2.267578125, 2.49462890625, 2.7216796875, 2.94873046875, 3.17578125, 3.40283203125, 3.6298828125, 3.85693359375, 4.083984375, 4.31103515625, 4.5380859375, 4.76513671875, 4.9921875, 5.21923828125, 5.4462890625, 5.67333984375, 5.900390625, 6.12744140625, 6.3544921875, 6.58154296875, 6.80859375, 7.03564453125, 7.2626953125, 7.48974609375, 7.716796875, 7.94384765625, 8.1708984375, 8.39794921875, 8.625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 12.0, 8.0, 19.0, 12.0, 31.0, 47.0, 52.0, 93.0, 155.0, 229.0, 383.0, 573.0, 940.0, 1468.0, 2466.0, 3911.0, 6358.0, 10199.0, 17185.0, 28968.0, 51658.0, 92597.0, 159173.0, 219792.0, 185749.0, 113812.0, 64163.0, 35810.0, 20633.0, 12248.0, 7546.0, 4582.0, 2901.0, 1728.0, 1153.0, 698.0, 445.0, 246.0, 156.0, 123.0, 71.0, 49.0, 36.0, 27.0, 18.0, 9.0, 9.0, 9.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.80712890625, -0.7831649780273438, -0.7592010498046875, -0.7352371215820312, -0.711273193359375, -0.6873092651367188, -0.6633453369140625, -0.6393814086914062, -0.61541748046875, -0.5914535522460938, -0.5674896240234375, -0.5435256958007812, -0.519561767578125, -0.49559783935546875, -0.4716339111328125, -0.44766998291015625, -0.4237060546875, -0.39974212646484375, -0.3757781982421875, -0.35181427001953125, -0.327850341796875, -0.30388641357421875, -0.2799224853515625, -0.25595855712890625, -0.23199462890625, -0.20803070068359375, -0.1840667724609375, -0.16010284423828125, -0.136138916015625, -0.11217498779296875, -0.0882110595703125, -0.06424713134765625, -0.040283203125, -0.01631927490234375, 0.0076446533203125, 0.03160858154296875, 0.055572509765625, 0.07953643798828125, 0.1035003662109375, 0.12746429443359375, 0.15142822265625, 0.17539215087890625, 0.1993560791015625, 0.22332000732421875, 0.247283935546875, 0.27124786376953125, 0.2952117919921875, 0.31917572021484375, 0.3431396484375, 0.36710357666015625, 0.3910675048828125, 0.41503143310546875, 0.438995361328125, 0.46295928955078125, 0.4869232177734375, 0.5108871459960938, 0.53485107421875, 0.5588150024414062, 0.5827789306640625, 0.6067428588867188, 0.630706787109375, 0.6546707153320312, 0.6786346435546875, 0.7025985717773438, 0.7265625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 5.0, 5.0, 8.0, 9.0, 8.0, 8.0, 10.0, 19.0, 19.0, 16.0, 20.0, 35.0, 24.0, 28.0, 29.0, 30.0, 32.0, 39.0, 46.0, 38.0, 36.0, 1069.0, 44.0, 47.0, 32.0, 41.0, 37.0, 35.0, 33.0, 30.0, 27.0, 22.0, 17.0, 24.0, 17.0, 16.0, 13.0, 11.0, 12.0, 8.0, 4.0, 0.0, 10.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.928466796875, -3.79443359375, -3.660400390625, -3.5263671875, -3.392333984375, -3.25830078125, -3.124267578125, -2.990234375, -2.856201171875, -2.72216796875, -2.588134765625, -2.4541015625, -2.320068359375, -2.18603515625, -2.052001953125, -1.91796875, -1.783935546875, -1.64990234375, -1.515869140625, -1.3818359375, -1.247802734375, -1.11376953125, -0.979736328125, -0.845703125, -0.711669921875, -0.57763671875, -0.443603515625, -0.3095703125, -0.175537109375, -0.04150390625, 0.092529296875, 0.2265625, 0.360595703125, 0.49462890625, 0.628662109375, 0.7626953125, 0.896728515625, 1.03076171875, 1.164794921875, 1.298828125, 1.432861328125, 1.56689453125, 1.700927734375, 1.8349609375, 1.968994140625, 2.10302734375, 2.237060546875, 2.37109375, 2.505126953125, 2.63916015625, 2.773193359375, 2.9072265625, 3.041259765625, 3.17529296875, 3.309326171875, 3.443359375, 3.577392578125, 3.71142578125, 3.845458984375, 3.9794921875, 4.113525390625, 4.24755859375, 4.381591796875, 4.515625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 8.0, 7.0, 11.0, 17.0, 29.0, 45.0, 85.0, 108.0, 184.0, 287.0, 457.0, 728.0, 1139.0, 1902.0, 3311.0, 5415.0, 9505.0, 15895.0, 28452.0, 50556.0, 89947.0, 149172.0, 1247166.0, 188347.0, 129085.0, 75740.0, 42388.0, 23697.0, 13713.0, 7901.0, 4721.0, 2794.0, 1665.0, 1051.0, 605.0, 385.0, 217.0, 142.0, 87.0, 61.0, 41.0, 18.0, 15.0, 15.0, 5.0, 10.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65625, -0.6362686157226562, -0.6162872314453125, -0.5963058471679688, -0.576324462890625, -0.5563430786132812, -0.5363616943359375, -0.5163803100585938, -0.49639892578125, -0.47641754150390625, -0.4564361572265625, -0.43645477294921875, -0.416473388671875, -0.39649200439453125, -0.3765106201171875, -0.35652923583984375, -0.3365478515625, -0.31656646728515625, -0.2965850830078125, -0.27660369873046875, -0.256622314453125, -0.23664093017578125, -0.2166595458984375, -0.19667816162109375, -0.17669677734375, -0.15671539306640625, -0.1367340087890625, -0.11675262451171875, -0.096771240234375, -0.07678985595703125, -0.0568084716796875, -0.03682708740234375, -0.016845703125, 0.00313568115234375, 0.0231170654296875, 0.04309844970703125, 0.063079833984375, 0.08306121826171875, 0.1030426025390625, 0.12302398681640625, 0.14300537109375, 0.16298675537109375, 0.1829681396484375, 0.20294952392578125, 0.222930908203125, 0.24291229248046875, 0.2628936767578125, 0.28287506103515625, 0.3028564453125, 0.32283782958984375, 0.3428192138671875, 0.36280059814453125, 0.382781982421875, 0.40276336669921875, 0.4227447509765625, 0.44272613525390625, 0.46270751953125, 0.48268890380859375, 0.5026702880859375, 0.5226516723632812, 0.542633056640625, 0.5626144409179688, 0.5825958251953125, 0.6025772094726562, 0.62255859375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 10.0, 7.0, 10.0, 15.0, 14.0, 25.0, 12.0, 27.0, 38.0, 39.0, 36.0, 44.0, 66.0, 60.0, 69.0, 55.0, 60.0, 60.0, 51.0, 48.0, 40.0, 43.0, 33.0, 27.0, 15.0, 26.0, 13.0, 13.0, 4.0, 5.0, 8.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024585723876953125, -0.0023823678493499756, -0.0023061633110046387, -0.0022299587726593018, -0.002153754234313965, -0.002077549695968628, -0.002001345157623291, -0.001925140619277954, -0.0018489360809326172, -0.0017727315425872803, -0.0016965270042419434, -0.0016203224658966064, -0.0015441179275512695, -0.0014679133892059326, -0.0013917088508605957, -0.0013155043125152588, -0.0012392997741699219, -0.001163095235824585, -0.001086890697479248, -0.0010106861591339111, -0.0009344816207885742, -0.0008582770824432373, -0.0007820725440979004, -0.0007058680057525635, -0.0006296634674072266, -0.0005534589290618896, -0.00047725439071655273, -0.0004010498523712158, -0.0003248453140258789, -0.000248640775680542, -0.00017243623733520508, -9.623169898986816e-05, -2.002716064453125e-05, 5.6177377700805664e-05, 0.00013238191604614258, 0.0002085864543914795, 0.0002847909927368164, 0.0003609955310821533, 0.00043720006942749023, 0.0005134046077728271, 0.0005896091461181641, 0.000665813684463501, 0.0007420182228088379, 0.0008182227611541748, 0.0008944272994995117, 0.0009706318378448486, 0.0010468363761901855, 0.0011230409145355225, 0.0011992454528808594, 0.0012754499912261963, 0.0013516545295715332, 0.0014278590679168701, 0.001504063606262207, 0.001580268144607544, 0.0016564726829528809, 0.0017326772212982178, 0.0018088817596435547, 0.0018850862979888916, 0.0019612908363342285, 0.0020374953746795654, 0.0021136999130249023, 0.0021899044513702393, 0.002266108989715576, 0.002342313528060913, 0.00241851806640625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 4.0, 4.0, 10.0, 6.0, 11.0, 13.0, 19.0, 25.0, 29.0, 36.0, 43.0, 61.0, 74.0, 105.0, 151.0, 241.0, 444.0, 1569.0, 355416.0, 686915.0, 2077.0, 464.0, 238.0, 141.0, 100.0, 82.0, 50.0, 51.0, 41.0, 24.0, 24.0, 12.0, 18.0, 13.0, 10.0, 3.0, 0.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.043853759765625, -0.04239463806152344, -0.040935516357421875, -0.03947639465332031, -0.03801727294921875, -0.03655815124511719, -0.035099029541015625, -0.03363990783691406, -0.0321807861328125, -0.030721664428710938, -0.029262542724609375, -0.027803421020507812, -0.02634429931640625, -0.024885177612304688, -0.023426055908203125, -0.021966934204101562, -0.0205078125, -0.019048690795898438, -0.017589569091796875, -0.016130447387695312, -0.01467132568359375, -0.013212203979492188, -0.011753082275390625, -0.010293960571289062, -0.0088348388671875, -0.0073757171630859375, -0.005916595458984375, -0.0044574737548828125, -0.00299835205078125, -0.0015392303466796875, -8.0108642578125e-05, 0.0013790130615234375, 0.002838134765625, 0.0042972564697265625, 0.005756378173828125, 0.0072154998779296875, 0.00867462158203125, 0.010133743286132812, 0.011592864990234375, 0.013051986694335938, 0.0145111083984375, 0.015970230102539062, 0.017429351806640625, 0.018888473510742188, 0.02034759521484375, 0.021806716918945312, 0.023265838623046875, 0.024724960327148438, 0.02618408203125, 0.027643203735351562, 0.029102325439453125, 0.030561447143554688, 0.03202056884765625, 0.03347969055175781, 0.034938812255859375, 0.03639793395996094, 0.0378570556640625, 0.03931617736816406, 0.040775299072265625, 0.04223442077636719, 0.04369354248046875, 0.04515266418457031, 0.046611785888671875, 0.04807090759277344, 0.049530029296875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 213.0, 798.0, 5.0], "bins": [-0.04439961910247803, -0.04368560016155243, -0.04297157749533653, -0.042257558554410934, -0.041543539613485336, -0.04082952067255974, -0.04011549800634384, -0.03940147906541824, -0.038687460124492645, -0.03797344118356705, -0.03725941851735115, -0.03654539957642555, -0.035831380635499954, -0.035117361694574356, -0.03440333902835846, -0.03368932008743286, -0.03297530114650726, -0.032261282205581665, -0.03154725953936577, -0.03083324059844017, -0.030119221657514572, -0.029405200853943825, -0.028691181913018227, -0.02797716110944748, -0.027263140305876732, -0.026549119502305984, -0.025835100561380386, -0.02512107975780964, -0.02440706081688404, -0.023693040013313293, -0.022979021072387695, -0.022265000268816948, -0.02155098132789135, -0.020836960524320602, -0.020122941583395004, -0.019408920779824257, -0.01869490183889866, -0.01798088103532791, -0.017266862094402313, -0.016552841290831566, -0.015838822349905968, -0.015124802477657795, -0.014410782605409622, -0.01369676273316145, -0.012982742860913277, -0.012268722988665104, -0.011554703116416931, -0.010840682312846184, -0.010126662440598011, -0.009412642568349838, -0.008698622696101665, -0.007984602823853493, -0.00727058295160532, -0.006556563079357147, -0.005842542741447687, -0.005128522869199514, -0.004414502531290054, -0.0037004826590418816, -0.002986462786793709, -0.0022724426817148924, -0.0015584228094667196, -0.0008444029372185469, -0.00013038283213973045, 0.0005836370401084423, 0.0012976567959412932]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 9.0, 27.0, 15.0, 22.0, 20.0, 20.0, 37.0, 31.0, 38.0, 39.0, 42.0, 42.0, 62.0, 63.0, 53.0, 57.0, 42.0, 54.0, 43.0, 48.0, 32.0, 38.0, 34.0, 24.0, 23.0, 23.0, 19.0, 14.0, 4.0, 8.0, 8.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012828707695007324, -0.001228678971529007, -0.0011744871735572815, -0.001120295375585556, -0.0010661035776138306, -0.001011911779642105, -0.0009577199816703796, -0.0009035281836986542, -0.0008493363857269287, -0.0007951445877552032, -0.0007409527897834778, -0.0006867609918117523, -0.0006325691938400269, -0.0005783773958683014, -0.0005241855978965759, -0.00046999379992485046, -0.000415802001953125, -0.00036161020398139954, -0.00030741840600967407, -0.0002532266080379486, -0.00019903481006622314, -0.00014484301209449768, -9.065121412277222e-05, -3.645941615104675e-05, 1.773238182067871e-05, 7.192417979240417e-05, 0.00012611597776412964, 0.0001803077757358551, 0.00023449957370758057, 0.00028869137167930603, 0.0003428831696510315, 0.00039707496762275696, 0.0004512667655944824, 0.0005054585635662079, 0.0005596503615379333, 0.0006138421595096588, 0.0006680339574813843, 0.0007222257554531097, 0.0007764175534248352, 0.0008306093513965607, 0.0008848011493682861, 0.0009389929473400116, 0.000993184745311737, 0.0010473765432834625, 0.001101568341255188, 0.0011557601392269135, 0.001209951937198639, 0.0012641437351703644, 0.0013183355331420898, 0.0013725273311138153, 0.0014267191290855408, 0.0014809109270572662, 0.0015351027250289917, 0.0015892945230007172, 0.0016434863209724426, 0.001697678118944168, 0.0017518699169158936, 0.001806061714887619, 0.0018602535128593445, 0.00191444531083107, 0.0019686371088027954, 0.002022828906774521, 0.0020770207047462463, 0.002131212502717972, 0.0021854043006896973]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 7.0, 7.0, 14.0, 6.0, 19.0, 19.0, 22.0, 30.0, 23.0, 28.0, 35.0, 34.0, 28.0, 44.0, 43.0, 45.0, 50.0, 34.0, 39.0, 51.0, 45.0, 42.0, 36.0, 38.0, 25.0, 36.0, 22.0, 17.0, 27.0, 17.0, 20.0, 13.0, 16.0, 12.0, 10.0, 9.0, 7.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.67919921875, -5.4521484375, -5.22509765625, -4.998046875, -4.77099609375, -4.5439453125, -4.31689453125, -4.08984375, -3.86279296875, -3.6357421875, -3.40869140625, -3.181640625, -2.95458984375, -2.7275390625, -2.50048828125, -2.2734375, -2.04638671875, -1.8193359375, -1.59228515625, -1.365234375, -1.13818359375, -0.9111328125, -0.68408203125, -0.45703125, -0.22998046875, -0.0029296875, 0.22412109375, 0.451171875, 0.67822265625, 0.9052734375, 1.13232421875, 1.359375, 1.58642578125, 1.8134765625, 2.04052734375, 2.267578125, 2.49462890625, 2.7216796875, 2.94873046875, 3.17578125, 3.40283203125, 3.6298828125, 3.85693359375, 4.083984375, 4.31103515625, 4.5380859375, 4.76513671875, 4.9921875, 5.21923828125, 5.4462890625, 5.67333984375, 5.900390625, 6.12744140625, 6.3544921875, 6.58154296875, 6.80859375, 7.03564453125, 7.2626953125, 7.48974609375, 7.716796875, 7.94384765625, 8.1708984375, 8.39794921875, 8.625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 5.0, 9.0, 7.0, 15.0, 15.0, 15.0, 27.0, 36.0, 39.0, 69.0, 63.0, 97.0, 149.0, 188.0, 295.0, 580.0, 1715.0, 7404.0, 51257.0, 535983.0, 401552.0, 40016.0, 6077.0, 1405.0, 528.0, 281.0, 184.0, 152.0, 102.0, 51.0, 55.0, 40.0, 34.0, 23.0, 22.0, 13.0, 12.0, 12.0, 9.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5859375, -11.1392822265625, -10.692626953125, -10.2459716796875, -9.79931640625, -9.3526611328125, -8.906005859375, -8.4593505859375, -8.0126953125, -7.5660400390625, -7.119384765625, -6.6727294921875, -6.22607421875, -5.7794189453125, -5.332763671875, -4.8861083984375, -4.439453125, -3.9927978515625, -3.546142578125, -3.0994873046875, -2.65283203125, -2.2061767578125, -1.759521484375, -1.3128662109375, -0.8662109375, -0.4195556640625, 0.027099609375, 0.4737548828125, 0.92041015625, 1.3670654296875, 1.813720703125, 2.2603759765625, 2.70703125, 3.1536865234375, 3.600341796875, 4.0469970703125, 4.49365234375, 4.9403076171875, 5.386962890625, 5.8336181640625, 6.2802734375, 6.7269287109375, 7.173583984375, 7.6202392578125, 8.06689453125, 8.5135498046875, 8.960205078125, 9.4068603515625, 9.853515625, 10.3001708984375, 10.746826171875, 11.1934814453125, 11.64013671875, 12.0867919921875, 12.533447265625, 12.9801025390625, 13.4267578125, 13.8734130859375, 14.320068359375, 14.7667236328125, 15.21337890625, 15.6600341796875, 16.106689453125, 16.5533447265625, 17.0]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 7.0, 17.0, 9.0, 12.0, 29.0, 22.0, 24.0, 25.0, 32.0, 54.0, 52.0, 34.0, 69.0, 121.0, 412.0, 1548.0, 135.0, 66.0, 56.0, 42.0, 50.0, 41.0, 31.0, 31.0, 21.0, 27.0, 10.0, 12.0, 11.0, 8.0, 9.0, 9.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.734375, -28.88720703125, -28.0400390625, -27.19287109375, -26.345703125, -25.49853515625, -24.6513671875, -23.80419921875, -22.95703125, -22.10986328125, -21.2626953125, -20.41552734375, -19.568359375, -18.72119140625, -17.8740234375, -17.02685546875, -16.1796875, -15.33251953125, -14.4853515625, -13.63818359375, -12.791015625, -11.94384765625, -11.0966796875, -10.24951171875, -9.40234375, -8.55517578125, -7.7080078125, -6.86083984375, -6.013671875, -5.16650390625, -4.3193359375, -3.47216796875, -2.625, -1.77783203125, -0.9306640625, -0.08349609375, 0.763671875, 1.61083984375, 2.4580078125, 3.30517578125, 4.15234375, 4.99951171875, 5.8466796875, 6.69384765625, 7.541015625, 8.38818359375, 9.2353515625, 10.08251953125, 10.9296875, 11.77685546875, 12.6240234375, 13.47119140625, 14.318359375, 15.16552734375, 16.0126953125, 16.85986328125, 17.70703125, 18.55419921875, 19.4013671875, 20.24853515625, 21.095703125, 21.94287109375, 22.7900390625, 23.63720703125, 24.484375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 10.0, 10.0, 12.0, 11.0, 13.0, 12.0, 30.0, 37.0, 34.0, 60.0, 90.0, 105.0, 181.0, 360.0, 929.0, 16013.0, 3109074.0, 16727.0, 1005.0, 360.0, 165.0, 143.0, 75.0, 60.0, 34.0, 36.0, 25.0, 28.0, 9.0, 16.0, 11.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.75, -52.8291015625, -50.908203125, -48.9873046875, -47.06640625, -45.1455078125, -43.224609375, -41.3037109375, -39.3828125, -37.4619140625, -35.541015625, -33.6201171875, -31.69921875, -29.7783203125, -27.857421875, -25.9365234375, -24.015625, -22.0947265625, -20.173828125, -18.2529296875, -16.33203125, -14.4111328125, -12.490234375, -10.5693359375, -8.6484375, -6.7275390625, -4.806640625, -2.8857421875, -0.96484375, 0.9560546875, 2.876953125, 4.7978515625, 6.71875, 8.6396484375, 10.560546875, 12.4814453125, 14.40234375, 16.3232421875, 18.244140625, 20.1650390625, 22.0859375, 24.0068359375, 25.927734375, 27.8486328125, 29.76953125, 31.6904296875, 33.611328125, 35.5322265625, 37.453125, 39.3740234375, 41.294921875, 43.2158203125, 45.13671875, 47.0576171875, 48.978515625, 50.8994140625, 52.8203125, 54.7412109375, 56.662109375, 58.5830078125, 60.50390625, 62.4248046875, 64.345703125, 66.2666015625, 68.1875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 50.0, 128.0, 271.0, 330.0, 147.0, 67.0, 13.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.9830551147461, -87.17090606689453, -85.3587646484375, -83.54661560058594, -81.73446655273438, -79.92231750488281, -78.11016845703125, -76.29802703857422, -74.48587799072266, -72.6737289428711, -70.86158752441406, -69.0494384765625, -67.23728942871094, -65.42514038085938, -63.61299514770508, -61.80084991455078, -59.98870086669922, -58.176551818847656, -56.36440658569336, -54.55226135253906, -52.7401123046875, -50.92796325683594, -49.11581802368164, -47.303672790527344, -45.49152374267578, -43.67937469482422, -41.86722946166992, -40.055084228515625, -38.24293518066406, -36.4307861328125, -34.6186408996582, -32.806495666503906, -30.99434471130371, -29.18219757080078, -27.37005043029785, -25.557903289794922, -23.745756149291992, -21.933609008789062, -20.121461868286133, -18.309314727783203, -16.497167587280273, -14.685020446777344, -12.872873306274414, -11.060726165771484, -9.248579025268555, -7.436431884765625, -5.624284744262695, -3.8121376037597656, -1.999990463256836, -0.18784332275390625, 1.6243038177490234, 3.436450958251953, 5.248598098754883, 7.0607452392578125, 8.872892379760742, 10.685039520263672, 12.497186660766602, 14.309333801269531, 16.12148094177246, 17.93362808227539, 19.74577522277832, 21.55792236328125, 23.37006950378418, 25.18221664428711, 26.99436378479004]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 10.0, 9.0, 7.0, 6.0, 10.0, 12.0, 11.0, 13.0, 32.0, 26.0, 27.0, 28.0, 23.0, 31.0, 27.0, 50.0, 39.0, 40.0, 38.0, 50.0, 48.0, 40.0, 42.0, 40.0, 44.0, 37.0, 37.0, 34.0, 33.0, 23.0, 23.0, 21.0, 17.0, 8.0, 4.0, 11.0, 10.0, 10.0, 8.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-53.07486343383789, -51.349910736083984, -49.624961853027344, -47.90000915527344, -46.17505645751953, -44.450103759765625, -42.72515106201172, -41.00020217895508, -39.27524948120117, -37.550296783447266, -35.825347900390625, -34.10039520263672, -32.37544250488281, -30.650489807128906, -28.925539016723633, -27.20058822631836, -25.475635528564453, -23.750682830810547, -22.025732040405273, -20.30078125, -18.575828552246094, -16.850875854492188, -15.125925064086914, -13.400973320007324, -11.676021575927734, -9.951069831848145, -8.226118087768555, -6.501166343688965, -4.776214599609375, -3.051262855529785, -1.3263111114501953, 0.39864063262939453, 2.1235885620117188, 3.8485403060913086, 5.573492050170898, 7.298443794250488, 9.023395538330078, 10.748347282409668, 12.473299026489258, 14.198250770568848, 15.923202514648438, 17.648155212402344, 19.373106002807617, 21.09805679321289, 22.823009490966797, 24.547962188720703, 26.272912979125977, 27.99786376953125, 29.722816467285156, 31.447769165039062, 33.17272186279297, 34.89767074584961, 36.622623443603516, 38.34757614135742, 40.07252502441406, 41.79747772216797, 43.522430419921875, 45.24738311767578, 46.97233581542969, 48.69728469848633, 50.422237396240234, 52.14719009399414, 53.87213897705078, 55.59709167480469, 57.322044372558594]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 5.0, 11.0, 6.0, 12.0, 12.0, 25.0, 13.0, 22.0, 27.0, 23.0, 34.0, 29.0, 30.0, 22.0, 36.0, 52.0, 51.0, 34.0, 44.0, 35.0, 32.0, 55.0, 41.0, 36.0, 29.0, 28.0, 27.0, 24.0, 31.0, 20.0, 22.0, 25.0, 14.0, 12.0, 11.0, 12.0, 8.0, 8.0, 7.0, 5.0, 3.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1484375, -5.92938232421875, -5.7103271484375, -5.49127197265625, -5.272216796875, -5.05316162109375, -4.8341064453125, -4.61505126953125, -4.39599609375, -4.17694091796875, -3.9578857421875, -3.73883056640625, -3.519775390625, -3.30072021484375, -3.0816650390625, -2.86260986328125, -2.6435546875, -2.42449951171875, -2.2054443359375, -1.98638916015625, -1.767333984375, -1.54827880859375, -1.3292236328125, -1.11016845703125, -0.89111328125, -0.67205810546875, -0.4530029296875, -0.23394775390625, -0.014892578125, 0.20416259765625, 0.4232177734375, 0.64227294921875, 0.861328125, 1.08038330078125, 1.2994384765625, 1.51849365234375, 1.737548828125, 1.95660400390625, 2.1756591796875, 2.39471435546875, 2.61376953125, 2.83282470703125, 3.0518798828125, 3.27093505859375, 3.489990234375, 3.70904541015625, 3.9281005859375, 4.14715576171875, 4.3662109375, 4.58526611328125, 4.8043212890625, 5.02337646484375, 5.242431640625, 5.46148681640625, 5.6805419921875, 5.89959716796875, 6.11865234375, 6.33770751953125, 6.5567626953125, 6.77581787109375, 6.994873046875, 7.21392822265625, 7.4329833984375, 7.65203857421875, 7.87109375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 3.0, 7.0, 3.0, 7.0, 7.0, 11.0, 10.0, 12.0, 10.0, 13.0, 17.0, 28.0, 21.0, 34.0, 46.0, 68.0, 112.0, 187.0, 349.0, 758.0, 1833.0, 5411.0, 22313.0, 174529.0, 1666558.0, 2043763.0, 239519.0, 28119.0, 6404.0, 2155.0, 926.0, 420.0, 200.0, 107.0, 75.0, 48.0, 40.0, 31.0, 24.0, 16.0, 19.0, 13.0, 11.0, 11.0, 13.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-14.4453125, -13.9483642578125, -13.451416015625, -12.9544677734375, -12.45751953125, -11.9605712890625, -11.463623046875, -10.9666748046875, -10.4697265625, -9.9727783203125, -9.475830078125, -8.9788818359375, -8.48193359375, -7.9849853515625, -7.488037109375, -6.9910888671875, -6.494140625, -5.9971923828125, -5.500244140625, -5.0032958984375, -4.50634765625, -4.0093994140625, -3.512451171875, -3.0155029296875, -2.5185546875, -2.0216064453125, -1.524658203125, -1.0277099609375, -0.53076171875, -0.0338134765625, 0.463134765625, 0.9600830078125, 1.45703125, 1.9539794921875, 2.450927734375, 2.9478759765625, 3.44482421875, 3.9417724609375, 4.438720703125, 4.9356689453125, 5.4326171875, 5.9295654296875, 6.426513671875, 6.9234619140625, 7.42041015625, 7.9173583984375, 8.414306640625, 8.9112548828125, 9.408203125, 9.9051513671875, 10.402099609375, 10.8990478515625, 11.39599609375, 11.8929443359375, 12.389892578125, 12.8868408203125, 13.3837890625, 13.8807373046875, 14.377685546875, 14.8746337890625, 15.37158203125, 15.8685302734375, 16.365478515625, 16.8624267578125, 17.359375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 6.0, 8.0, 8.0, 10.0, 13.0, 19.0, 18.0, 19.0, 31.0, 47.0, 74.0, 81.0, 126.0, 187.0, 234.0, 285.0, 369.0, 429.0, 464.0, 400.0, 328.0, 261.0, 178.0, 102.0, 94.0, 66.0, 54.0, 35.0, 36.0, 19.0, 20.0, 8.0, 10.0, 11.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.921875, -12.543701171875, -12.16552734375, -11.787353515625, -11.4091796875, -11.031005859375, -10.65283203125, -10.274658203125, -9.896484375, -9.518310546875, -9.14013671875, -8.761962890625, -8.3837890625, -8.005615234375, -7.62744140625, -7.249267578125, -6.87109375, -6.492919921875, -6.11474609375, -5.736572265625, -5.3583984375, -4.980224609375, -4.60205078125, -4.223876953125, -3.845703125, -3.467529296875, -3.08935546875, -2.711181640625, -2.3330078125, -1.954833984375, -1.57666015625, -1.198486328125, -0.8203125, -0.442138671875, -0.06396484375, 0.314208984375, 0.6923828125, 1.070556640625, 1.44873046875, 1.826904296875, 2.205078125, 2.583251953125, 2.96142578125, 3.339599609375, 3.7177734375, 4.095947265625, 4.47412109375, 4.852294921875, 5.23046875, 5.608642578125, 5.98681640625, 6.364990234375, 6.7431640625, 7.121337890625, 7.49951171875, 7.877685546875, 8.255859375, 8.634033203125, 9.01220703125, 9.390380859375, 9.7685546875, 10.146728515625, 10.52490234375, 10.903076171875, 11.28125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 7.0, 4.0, 3.0, 4.0, 6.0, 10.0, 12.0, 20.0, 29.0, 26.0, 21.0, 43.0, 60.0, 61.0, 72.0, 108.0, 150.0, 191.0, 352.0, 629.0, 1605.0, 5716.0, 35793.0, 758829.0, 3246655.0, 126089.0, 12580.0, 2791.0, 988.0, 450.0, 264.0, 178.0, 117.0, 93.0, 72.0, 46.0, 46.0, 47.0, 18.0, 27.0, 13.0, 17.0, 19.0, 10.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.125, -29.12890625, -28.1328125, -27.13671875, -26.140625, -25.14453125, -24.1484375, -23.15234375, -22.15625, -21.16015625, -20.1640625, -19.16796875, -18.171875, -17.17578125, -16.1796875, -15.18359375, -14.1875, -13.19140625, -12.1953125, -11.19921875, -10.203125, -9.20703125, -8.2109375, -7.21484375, -6.21875, -5.22265625, -4.2265625, -3.23046875, -2.234375, -1.23828125, -0.2421875, 0.75390625, 1.75, 2.74609375, 3.7421875, 4.73828125, 5.734375, 6.73046875, 7.7265625, 8.72265625, 9.71875, 10.71484375, 11.7109375, 12.70703125, 13.703125, 14.69921875, 15.6953125, 16.69140625, 17.6875, 18.68359375, 19.6796875, 20.67578125, 21.671875, 22.66796875, 23.6640625, 24.66015625, 25.65625, 26.65234375, 27.6484375, 28.64453125, 29.640625, 30.63671875, 31.6328125, 32.62890625, 33.625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 10.0, 60.0, 212.0, 369.0, 256.0, 82.0, 21.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-257.1615295410156, -251.8807373046875, -246.59996032714844, -241.3191680908203, -236.0383758544922, -230.75759887695312, -225.476806640625, -220.19601440429688, -214.9152374267578, -209.6344451904297, -204.35366821289062, -199.0728759765625, -193.79208374023438, -188.5113067626953, -183.2305145263672, -177.94973754882812, -172.6689453125, -167.38815307617188, -162.1073760986328, -156.8265838623047, -151.54579162597656, -146.2650146484375, -140.98422241210938, -135.70343017578125, -130.42263793945312, -125.14185333251953, -119.8610610961914, -114.58027648925781, -109.29949188232422, -104.01870727539062, -98.7379150390625, -93.4571304321289, -88.17633819580078, -82.89555358886719, -77.61476135253906, -72.33397674560547, -67.05319213867188, -61.772403717041016, -56.491615295410156, -51.21083068847656, -45.9300422668457, -40.649253845214844, -35.36846923828125, -30.08768081665039, -24.806894302368164, -19.526107788085938, -14.245319366455078, -8.964534759521484, -3.683746337890625, 1.5970406532287598, 6.8778276443481445, 12.158615112304688, 17.439401626586914, 22.72018814086914, 28.0009765625, 33.281761169433594, 38.56254959106445, 43.84333801269531, 49.124122619628906, 54.404911041259766, 59.685699462890625, 64.96648406982422, 70.24726867675781, 75.52806091308594, 80.80884552001953]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 7.0, 6.0, 12.0, 5.0, 11.0, 10.0, 25.0, 10.0, 19.0, 30.0, 21.0, 31.0, 25.0, 28.0, 42.0, 36.0, 34.0, 42.0, 43.0, 49.0, 39.0, 48.0, 50.0, 33.0, 30.0, 30.0, 35.0, 35.0, 30.0, 26.0, 25.0, 18.0, 25.0, 17.0, 12.0, 13.0, 9.0, 6.0, 13.0, 3.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-45.03558349609375, -43.67991256713867, -42.32424545288086, -40.96857452392578, -39.61290740966797, -38.25723648071289, -36.90156555175781, -35.5458984375, -34.19023132324219, -32.83456039428711, -31.478893280029297, -30.12322235107422, -28.767555236816406, -27.411884307861328, -26.056215286254883, -24.700546264648438, -23.34487533569336, -21.989206314086914, -20.63353729248047, -19.27786636352539, -17.922199249267578, -16.5665283203125, -15.210859298706055, -13.85519027709961, -12.499521255493164, -11.143852233886719, -9.788183212280273, -8.432513236999512, -7.076844215393066, -5.721175193786621, -4.365505218505859, -3.009836196899414, -1.6541671752929688, -0.29849791526794434, 1.05717134475708, 2.4128408432006836, 3.768509864807129, 5.124178886413574, 6.479848861694336, 7.835517883300781, 9.191186904907227, 10.546855926513672, 11.902524948120117, 13.258194923400879, 14.613863945007324, 15.96953296661377, 17.32520294189453, 18.680871963500977, 20.036540985107422, 21.392210006713867, 22.747879028320312, 24.10354995727539, 25.459217071533203, 26.81488800048828, 28.170557022094727, 29.526226043701172, 30.881895065307617, 32.23756408691406, 33.59323501586914, 34.94890213012695, 36.30457305908203, 37.660240173339844, 39.01591110229492, 40.37158203125, 41.72724914550781]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 1.0, 2.0, 7.0, 5.0, 6.0, 11.0, 16.0, 13.0, 14.0, 15.0, 13.0, 11.0, 26.0, 29.0, 35.0, 32.0, 24.0, 22.0, 36.0, 42.0, 42.0, 32.0, 36.0, 46.0, 44.0, 44.0, 43.0, 31.0, 26.0, 30.0, 28.0, 32.0, 29.0, 22.0, 21.0, 23.0, 18.0, 11.0, 14.0, 13.0, 12.0, 7.0, 7.0, 11.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.46820068359375, -6.2489013671875, -6.02960205078125, -5.810302734375, -5.59100341796875, -5.3717041015625, -5.15240478515625, -4.93310546875, -4.71380615234375, -4.4945068359375, -4.27520751953125, -4.055908203125, -3.83660888671875, -3.6173095703125, -3.39801025390625, -3.1787109375, -2.95941162109375, -2.7401123046875, -2.52081298828125, -2.301513671875, -2.08221435546875, -1.8629150390625, -1.64361572265625, -1.42431640625, -1.20501708984375, -0.9857177734375, -0.76641845703125, -0.547119140625, -0.32781982421875, -0.1085205078125, 0.11077880859375, 0.330078125, 0.54937744140625, 0.7686767578125, 0.98797607421875, 1.207275390625, 1.42657470703125, 1.6458740234375, 1.86517333984375, 2.08447265625, 2.30377197265625, 2.5230712890625, 2.74237060546875, 2.961669921875, 3.18096923828125, 3.4002685546875, 3.61956787109375, 3.8388671875, 4.05816650390625, 4.2774658203125, 4.49676513671875, 4.716064453125, 4.93536376953125, 5.1546630859375, 5.37396240234375, 5.59326171875, 5.81256103515625, 6.0318603515625, 6.25115966796875, 6.470458984375, 6.68975830078125, 6.9090576171875, 7.12835693359375, 7.34765625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 11.0, 9.0, 19.0, 29.0, 25.0, 70.0, 80.0, 164.0, 233.0, 329.0, 542.0, 760.0, 1159.0, 1938.0, 2978.0, 4572.0, 7404.0, 11886.0, 19448.0, 32753.0, 55997.0, 95774.0, 155651.0, 205569.0, 174882.0, 112565.0, 65476.0, 38301.0, 22909.0, 13771.0, 8497.0, 5249.0, 3334.0, 2173.0, 1411.0, 904.0, 564.0, 359.0, 257.0, 167.0, 110.0, 67.0, 59.0, 29.0, 26.0, 15.0, 12.0, 5.0, 7.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.79638671875, -0.7727203369140625, -0.749053955078125, -0.7253875732421875, -0.70172119140625, -0.6780548095703125, -0.654388427734375, -0.6307220458984375, -0.6070556640625, -0.5833892822265625, -0.559722900390625, -0.5360565185546875, -0.51239013671875, -0.4887237548828125, -0.465057373046875, -0.4413909912109375, -0.417724609375, -0.3940582275390625, -0.370391845703125, -0.3467254638671875, -0.32305908203125, -0.2993927001953125, -0.275726318359375, -0.2520599365234375, -0.2283935546875, -0.2047271728515625, -0.181060791015625, -0.1573944091796875, -0.13372802734375, -0.1100616455078125, -0.086395263671875, -0.0627288818359375, -0.0390625, -0.0153961181640625, 0.008270263671875, 0.0319366455078125, 0.05560302734375, 0.0792694091796875, 0.102935791015625, 0.1266021728515625, 0.1502685546875, 0.1739349365234375, 0.197601318359375, 0.2212677001953125, 0.24493408203125, 0.2686004638671875, 0.292266845703125, 0.3159332275390625, 0.339599609375, 0.3632659912109375, 0.386932373046875, 0.4105987548828125, 0.43426513671875, 0.4579315185546875, 0.481597900390625, 0.5052642822265625, 0.5289306640625, 0.5525970458984375, 0.576263427734375, 0.5999298095703125, 0.62359619140625, 0.6472625732421875, 0.670928955078125, 0.6945953369140625, 0.71826171875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 4.0, 6.0, 9.0, 9.0, 11.0, 9.0, 7.0, 10.0, 19.0, 25.0, 31.0, 17.0, 28.0, 26.0, 47.0, 36.0, 36.0, 40.0, 42.0, 31.0, 44.0, 1060.0, 42.0, 47.0, 33.0, 34.0, 35.0, 31.0, 43.0, 32.0, 26.0, 21.0, 25.0, 16.0, 23.0, 16.0, 10.0, 6.0, 8.0, 6.0, 7.0, 6.0, 4.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-5.1015625, -4.9530029296875, -4.804443359375, -4.6558837890625, -4.50732421875, -4.3587646484375, -4.210205078125, -4.0616455078125, -3.9130859375, -3.7645263671875, -3.615966796875, -3.4674072265625, -3.31884765625, -3.1702880859375, -3.021728515625, -2.8731689453125, -2.724609375, -2.5760498046875, -2.427490234375, -2.2789306640625, -2.13037109375, -1.9818115234375, -1.833251953125, -1.6846923828125, -1.5361328125, -1.3875732421875, -1.239013671875, -1.0904541015625, -0.94189453125, -0.7933349609375, -0.644775390625, -0.4962158203125, -0.34765625, -0.1990966796875, -0.050537109375, 0.0980224609375, 0.24658203125, 0.3951416015625, 0.543701171875, 0.6922607421875, 0.8408203125, 0.9893798828125, 1.137939453125, 1.2864990234375, 1.43505859375, 1.5836181640625, 1.732177734375, 1.8807373046875, 2.029296875, 2.1778564453125, 2.326416015625, 2.4749755859375, 2.62353515625, 2.7720947265625, 2.920654296875, 3.0692138671875, 3.2177734375, 3.3663330078125, 3.514892578125, 3.6634521484375, 3.81201171875, 3.9605712890625, 4.109130859375, 4.2576904296875, 4.40625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 12.0, 7.0, 22.0, 21.0, 32.0, 49.0, 79.0, 115.0, 183.0, 238.0, 449.0, 675.0, 1034.0, 1648.0, 2682.0, 4442.0, 6896.0, 11138.0, 18353.0, 29077.0, 47974.0, 78086.0, 121352.0, 164438.0, 1221834.0, 139396.0, 94849.0, 58394.0, 35932.0, 21861.0, 13284.0, 8499.0, 5203.0, 3225.0, 2033.0, 1263.0, 779.0, 567.0, 356.0, 212.0, 149.0, 93.0, 61.0, 46.0, 35.0, 18.0, 15.0, 4.0, 10.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.59375, -0.57586669921875, -0.5579833984375, -0.54010009765625, -0.522216796875, -0.50433349609375, -0.4864501953125, -0.46856689453125, -0.45068359375, -0.43280029296875, -0.4149169921875, -0.39703369140625, -0.379150390625, -0.36126708984375, -0.3433837890625, -0.32550048828125, -0.3076171875, -0.28973388671875, -0.2718505859375, -0.25396728515625, -0.236083984375, -0.21820068359375, -0.2003173828125, -0.18243408203125, -0.16455078125, -0.14666748046875, -0.1287841796875, -0.11090087890625, -0.093017578125, -0.07513427734375, -0.0572509765625, -0.03936767578125, -0.021484375, -0.00360107421875, 0.0142822265625, 0.03216552734375, 0.050048828125, 0.06793212890625, 0.0858154296875, 0.10369873046875, 0.12158203125, 0.13946533203125, 0.1573486328125, 0.17523193359375, 0.193115234375, 0.21099853515625, 0.2288818359375, 0.24676513671875, 0.2646484375, 0.28253173828125, 0.3004150390625, 0.31829833984375, 0.336181640625, 0.35406494140625, 0.3719482421875, 0.38983154296875, 0.40771484375, 0.42559814453125, 0.4434814453125, 0.46136474609375, 0.479248046875, 0.49713134765625, 0.5150146484375, 0.53289794921875, 0.55078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 4.0, 7.0, 13.0, 22.0, 16.0, 17.0, 15.0, 20.0, 27.0, 29.0, 43.0, 38.0, 50.0, 37.0, 49.0, 50.0, 54.0, 48.0, 40.0, 50.0, 39.0, 41.0, 37.0, 34.0, 34.0, 32.0, 21.0, 17.0, 15.0, 10.0, 14.0, 16.0, 16.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0017518997192382812, -0.001692935824394226, -0.001633971929550171, -0.0015750080347061157, -0.0015160441398620605, -0.0014570802450180054, -0.0013981163501739502, -0.001339152455329895, -0.0012801885604858398, -0.0012212246656417847, -0.0011622607707977295, -0.0011032968759536743, -0.0010443329811096191, -0.000985369086265564, -0.0009264051914215088, -0.0008674412965774536, -0.0008084774017333984, -0.0007495135068893433, -0.0006905496120452881, -0.0006315857172012329, -0.0005726218223571777, -0.0005136579275131226, -0.0004546940326690674, -0.0003957301378250122, -0.00033676624298095703, -0.00027780234813690186, -0.00021883845329284668, -0.0001598745584487915, -0.00010091066360473633, -4.194676876068115e-05, 1.7017126083374023e-05, 7.59810209274292e-05, 0.00013494491577148438, 0.00019390881061553955, 0.0002528727054595947, 0.0003118366003036499, 0.0003708004951477051, 0.00042976438999176025, 0.0004887282848358154, 0.0005476921796798706, 0.0006066560745239258, 0.000665619969367981, 0.0007245838642120361, 0.0007835477590560913, 0.0008425116539001465, 0.0009014755487442017, 0.0009604394435882568, 0.001019403338432312, 0.0010783672332763672, 0.0011373311281204224, 0.0011962950229644775, 0.0012552589178085327, 0.0013142228126525879, 0.001373186707496643, 0.0014321506023406982, 0.0014911144971847534, 0.0015500783920288086, 0.0016090422868728638, 0.001668006181716919, 0.0017269700765609741, 0.0017859339714050293, 0.0018448978662490845, 0.0019038617610931396, 0.001962825655937195, 0.00202178955078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 6.0, 7.0, 5.0, 13.0, 19.0, 14.0, 17.0, 20.0, 30.0, 27.0, 31.0, 58.0, 68.0, 86.0, 123.0, 155.0, 223.0, 450.0, 1180.0, 65527.0, 972343.0, 6360.0, 682.0, 337.0, 199.0, 126.0, 93.0, 63.0, 53.0, 52.0, 34.0, 31.0, 24.0, 16.0, 18.0, 10.0, 14.0, 8.0, 4.0, 6.0, 5.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0], "bins": [-0.044769287109375, -0.043535709381103516, -0.04230213165283203, -0.04106855392456055, -0.03983497619628906, -0.03860139846801758, -0.037367820739746094, -0.03613424301147461, -0.034900665283203125, -0.03366708755493164, -0.032433509826660156, -0.031199932098388672, -0.029966354370117188, -0.028732776641845703, -0.02749919891357422, -0.026265621185302734, -0.02503204345703125, -0.023798465728759766, -0.02256488800048828, -0.021331310272216797, -0.020097732543945312, -0.018864154815673828, -0.017630577087402344, -0.01639699935913086, -0.015163421630859375, -0.01392984390258789, -0.012696266174316406, -0.011462688446044922, -0.010229110717773438, -0.008995532989501953, -0.007761955261230469, -0.006528377532958984, -0.0052947998046875, -0.004061222076416016, -0.0028276443481445312, -0.0015940666198730469, -0.0003604888916015625, 0.0008730888366699219, 0.0021066665649414062, 0.0033402442932128906, 0.004573822021484375, 0.005807399749755859, 0.007040977478027344, 0.008274555206298828, 0.009508132934570312, 0.010741710662841797, 0.011975288391113281, 0.013208866119384766, 0.01444244384765625, 0.015676021575927734, 0.01690959930419922, 0.018143177032470703, 0.019376754760742188, 0.020610332489013672, 0.021843910217285156, 0.02307748794555664, 0.024311065673828125, 0.02554464340209961, 0.026778221130371094, 0.028011798858642578, 0.029245376586914062, 0.030478954315185547, 0.03171253204345703, 0.032946109771728516, 0.0341796875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 14.0, 36.0, 60.0, 184.0, 279.0, 260.0, 136.0, 28.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0051488433964550495, -0.00503904465585947, -0.004929245915263891, -0.004819447174668312, -0.00470964889973402, -0.004599850159138441, -0.004490051418542862, -0.004380252677947283, -0.004270453937351704, -0.0041606551967561245, -0.004050856456160545, -0.0039410581812262535, -0.0038312592078000307, -0.003721460700035095, -0.003611661959439516, -0.003501863218843937, -0.0033920647110790014, -0.0032822659704834223, -0.003172467462718487, -0.0030626687221229076, -0.0029528699815273285, -0.0028430712409317493, -0.002733272733166814, -0.0026234739925712347, -0.002513675484806299, -0.00240387674421072, -0.0022940782364457846, -0.0021842794958502054, -0.0020744807552546263, -0.0019646822474896908, -0.0018548835068941116, -0.0017450847662985325, -0.0016352861421182752, -0.0015254875179380178, -0.0014156887773424387, -0.0013058901531621814, -0.001196091528981924, -0.001086292788386345, -0.0009764941642060876, -0.0008666954818181694, -0.0007568967994302511, -0.0006470981170423329, -0.0005372994346544147, -0.00042750081047415733, -0.0003177021280862391, -0.00020790344569832087, -9.810482151806355e-05, 1.1693860869854689e-05, 0.00012149254325777292, 0.00023129121109377593, 0.00034108987892977893, 0.0004508885322138667, 0.0005606872146017849, 0.0006704858969897032, 0.0007802845211699605, 0.0008900832035578787, 0.000999881885945797, 0.0011096805101260543, 0.0012194792507216334, 0.0013292778749018908, 0.00143907661549747, 0.0015488752396777272, 0.0016586738638579845, 0.0017684726044535637, 0.001878271228633821]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 7.0, 5.0, 10.0, 9.0, 11.0, 17.0, 30.0, 23.0, 16.0, 31.0, 32.0, 37.0, 50.0, 43.0, 51.0, 44.0, 61.0, 51.0, 51.0, 43.0, 44.0, 51.0, 43.0, 31.0, 32.0, 29.0, 22.0, 19.0, 26.0, 22.0, 9.0, 7.0, 8.0, 11.0, 9.0, 4.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012853741645812988, -0.0012443633750081062, -0.0012033525854349136, -0.001162341795861721, -0.0011213310062885284, -0.0010803202167153358, -0.0010393094271421432, -0.0009982986375689507, -0.0009572878479957581, -0.0009162770584225655, -0.0008752662688493729, -0.0008342554792761803, -0.0007932446897029877, -0.0007522339001297951, -0.0007112231105566025, -0.0006702123209834099, -0.0006292015314102173, -0.0005881907418370247, -0.0005471799522638321, -0.0005061691626906395, -0.0004651583731174469, -0.0004241475835442543, -0.0003831367939710617, -0.0003421260043978691, -0.0003011152148246765, -0.0002601044252514839, -0.00021909363567829132, -0.00017808284610509872, -0.00013707205653190613, -9.606126695871353e-05, -5.5050477385520935e-05, -1.4039687812328339e-05, 2.6971101760864258e-05, 6.798189133405685e-05, 0.00010899268090724945, 0.00015000347048044205, 0.00019101426005363464, 0.00023202504962682724, 0.00027303583920001984, 0.00031404662877321243, 0.00035505741834640503, 0.0003960682079195976, 0.0004370789974927902, 0.0004780897870659828, 0.0005191005766391754, 0.000560111366212368, 0.0006011221557855606, 0.0006421329453587532, 0.0006831437349319458, 0.0007241545245051384, 0.000765165314078331, 0.0008061761036515236, 0.0008471868932247162, 0.0008881976827979088, 0.0009292084723711014, 0.000970219261944294, 0.0010112300515174866, 0.0010522408410906792, 0.0010932516306638718, 0.0011342624202370644, 0.001175273209810257, 0.0012162839993834496, 0.0012572947889566422, 0.0012983055785298347, 0.0013393163681030273]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 1.0, 2.0, 7.0, 5.0, 6.0, 11.0, 16.0, 13.0, 14.0, 15.0, 13.0, 11.0, 26.0, 29.0, 35.0, 32.0, 24.0, 22.0, 36.0, 42.0, 41.0, 33.0, 36.0, 46.0, 44.0, 44.0, 43.0, 31.0, 26.0, 30.0, 28.0, 32.0, 29.0, 22.0, 21.0, 23.0, 18.0, 11.0, 14.0, 13.0, 12.0, 7.0, 7.0, 11.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.46820068359375, -6.2489013671875, -6.02960205078125, -5.810302734375, -5.59100341796875, -5.3717041015625, -5.15240478515625, -4.93310546875, -4.71380615234375, -4.4945068359375, -4.27520751953125, -4.055908203125, -3.83660888671875, -3.6173095703125, -3.39801025390625, -3.1787109375, -2.95941162109375, -2.7401123046875, -2.52081298828125, -2.301513671875, -2.08221435546875, -1.8629150390625, -1.64361572265625, -1.42431640625, -1.20501708984375, -0.9857177734375, -0.76641845703125, -0.547119140625, -0.32781982421875, -0.1085205078125, 0.11077880859375, 0.330078125, 0.54937744140625, 0.7686767578125, 0.98797607421875, 1.207275390625, 1.42657470703125, 1.6458740234375, 1.86517333984375, 2.08447265625, 2.30377197265625, 2.5230712890625, 2.74237060546875, 2.961669921875, 3.18096923828125, 3.4002685546875, 3.61956787109375, 3.8388671875, 4.05816650390625, 4.2774658203125, 4.49676513671875, 4.716064453125, 4.93536376953125, 5.1546630859375, 5.37396240234375, 5.59326171875, 5.81256103515625, 6.0318603515625, 6.25115966796875, 6.470458984375, 6.68975830078125, 6.9090576171875, 7.12835693359375, 7.34765625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 1.0, 5.0, 9.0, 3.0, 5.0, 12.0, 9.0, 9.0, 24.0, 26.0, 30.0, 45.0, 38.0, 74.0, 61.0, 109.0, 147.0, 209.0, 275.0, 322.0, 422.0, 650.0, 1187.0, 3344.0, 15247.0, 97061.0, 814068.0, 93484.0, 14709.0, 3355.0, 1117.0, 651.0, 426.0, 314.0, 279.0, 212.0, 154.0, 111.0, 84.0, 69.0, 41.0, 27.0, 34.0, 21.0, 18.0, 14.0, 14.0, 8.0, 7.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.90625, -16.351806640625, -15.79736328125, -15.242919921875, -14.6884765625, -14.134033203125, -13.57958984375, -13.025146484375, -12.470703125, -11.916259765625, -11.36181640625, -10.807373046875, -10.2529296875, -9.698486328125, -9.14404296875, -8.589599609375, -8.03515625, -7.480712890625, -6.92626953125, -6.371826171875, -5.8173828125, -5.262939453125, -4.70849609375, -4.154052734375, -3.599609375, -3.045166015625, -2.49072265625, -1.936279296875, -1.3818359375, -0.827392578125, -0.27294921875, 0.281494140625, 0.8359375, 1.390380859375, 1.94482421875, 2.499267578125, 3.0537109375, 3.608154296875, 4.16259765625, 4.717041015625, 5.271484375, 5.825927734375, 6.38037109375, 6.934814453125, 7.4892578125, 8.043701171875, 8.59814453125, 9.152587890625, 9.70703125, 10.261474609375, 10.81591796875, 11.370361328125, 11.9248046875, 12.479248046875, 13.03369140625, 13.588134765625, 14.142578125, 14.697021484375, 15.25146484375, 15.805908203125, 16.3603515625, 16.914794921875, 17.46923828125, 18.023681640625, 18.578125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 8.0, 6.0, 5.0, 4.0, 10.0, 9.0, 18.0, 17.0, 22.0, 11.0, 15.0, 26.0, 24.0, 32.0, 34.0, 35.0, 53.0, 46.0, 52.0, 103.0, 245.0, 1639.0, 131.0, 71.0, 58.0, 48.0, 42.0, 28.0, 42.0, 31.0, 21.0, 30.0, 19.0, 26.0, 15.0, 11.0, 15.0, 14.0, 11.0, 7.0, 2.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.015625, -20.2724609375, -19.529296875, -18.7861328125, -18.04296875, -17.2998046875, -16.556640625, -15.8134765625, -15.0703125, -14.3271484375, -13.583984375, -12.8408203125, -12.09765625, -11.3544921875, -10.611328125, -9.8681640625, -9.125, -8.3818359375, -7.638671875, -6.8955078125, -6.15234375, -5.4091796875, -4.666015625, -3.9228515625, -3.1796875, -2.4365234375, -1.693359375, -0.9501953125, -0.20703125, 0.5361328125, 1.279296875, 2.0224609375, 2.765625, 3.5087890625, 4.251953125, 4.9951171875, 5.73828125, 6.4814453125, 7.224609375, 7.9677734375, 8.7109375, 9.4541015625, 10.197265625, 10.9404296875, 11.68359375, 12.4267578125, 13.169921875, 13.9130859375, 14.65625, 15.3994140625, 16.142578125, 16.8857421875, 17.62890625, 18.3720703125, 19.115234375, 19.8583984375, 20.6015625, 21.3447265625, 22.087890625, 22.8310546875, 23.57421875, 24.3173828125, 25.060546875, 25.8037109375, 26.546875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 3.0, 4.0, 5.0, 6.0, 9.0, 14.0, 18.0, 16.0, 20.0, 23.0, 26.0, 33.0, 35.0, 45.0, 59.0, 80.0, 112.0, 196.0, 354.0, 998.0, 8473.0, 3081142.0, 50944.0, 1787.0, 517.0, 235.0, 137.0, 90.0, 63.0, 44.0, 35.0, 29.0, 17.0, 23.0, 24.0, 19.0, 18.0, 11.0, 7.0, 9.0, 2.0, 7.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-74.625, -72.4736328125, -70.322265625, -68.1708984375, -66.01953125, -63.8681640625, -61.716796875, -59.5654296875, -57.4140625, -55.2626953125, -53.111328125, -50.9599609375, -48.80859375, -46.6572265625, -44.505859375, -42.3544921875, -40.203125, -38.0517578125, -35.900390625, -33.7490234375, -31.59765625, -29.4462890625, -27.294921875, -25.1435546875, -22.9921875, -20.8408203125, -18.689453125, -16.5380859375, -14.38671875, -12.2353515625, -10.083984375, -7.9326171875, -5.78125, -3.6298828125, -1.478515625, 0.6728515625, 2.82421875, 4.9755859375, 7.126953125, 9.2783203125, 11.4296875, 13.5810546875, 15.732421875, 17.8837890625, 20.03515625, 22.1865234375, 24.337890625, 26.4892578125, 28.640625, 30.7919921875, 32.943359375, 35.0947265625, 37.24609375, 39.3974609375, 41.548828125, 43.7001953125, 45.8515625, 48.0029296875, 50.154296875, 52.3056640625, 54.45703125, 56.6083984375, 58.759765625, 60.9111328125, 63.0625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 243.0, 601.0, 160.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.7018814086914, -120.00689697265625, -116.3119125366211, -112.61692810058594, -108.92194366455078, -105.22695922851562, -101.53197479248047, -97.83699035644531, -94.14200592041016, -90.447021484375, -86.75203704833984, -83.05705261230469, -79.36206817626953, -75.66708374023438, -71.97209930419922, -68.27711486816406, -64.58212280273438, -60.88713836669922, -57.19215393066406, -53.497169494628906, -49.80218505859375, -46.107200622558594, -42.41221618652344, -38.71723175048828, -35.022247314453125, -31.32726287841797, -27.632278442382812, -23.937294006347656, -20.2423095703125, -16.54732322692871, -12.852338790893555, -9.157354354858398, -5.462371826171875, -1.7673871517181396, 1.9275975227355957, 5.62258243560791, 9.317566871643066, 13.012552261352539, 16.707536697387695, 20.40252113342285, 24.097505569458008, 27.792490005493164, 31.48747444152832, 35.18246078491211, 38.877445220947266, 42.57242965698242, 46.26741409301758, 49.962398529052734, 53.65738296508789, 57.35236740112305, 61.0473518371582, 64.74234008789062, 68.43732452392578, 72.13230895996094, 75.8272933959961, 79.52227783203125, 83.2172622680664, 86.91224670410156, 90.60723114013672, 94.30221557617188, 97.99720001220703, 101.69218444824219, 105.38716888427734, 109.0821533203125, 112.77713775634766]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 1.0, 0.0, 5.0, 2.0, 4.0, 2.0, 7.0, 6.0, 8.0, 8.0, 8.0, 10.0, 21.0, 14.0, 28.0, 20.0, 29.0, 27.0, 24.0, 40.0, 39.0, 37.0, 34.0, 43.0, 45.0, 30.0, 42.0, 40.0, 51.0, 31.0, 45.0, 33.0, 33.0, 31.0, 15.0, 22.0, 17.0, 13.0, 24.0, 13.0, 20.0, 12.0, 13.0, 4.0, 14.0, 6.0, 4.0, 10.0, 5.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 4.0], "bins": [-58.57500076293945, -56.92686080932617, -55.27872085571289, -53.63058090209961, -51.98244094848633, -50.33430099487305, -48.6861572265625, -47.03801727294922, -45.38987731933594, -43.741737365722656, -42.093597412109375, -40.445457458496094, -38.79731750488281, -37.14917755126953, -35.50103759765625, -33.85289764404297, -32.20475769042969, -30.556617736816406, -28.908477783203125, -27.260337829589844, -25.612197875976562, -23.96405792236328, -22.315916061401367, -20.667776107788086, -19.019636154174805, -17.371496200561523, -15.723356246948242, -14.075215339660645, -12.427075386047363, -10.778935432434082, -9.130794525146484, -7.482654571533203, -5.8345184326171875, -4.186378479003906, -2.538238048553467, -0.8900976181030273, 0.7580423355102539, 2.406182289123535, 4.054323196411133, 5.702463150024414, 7.350603103637695, 8.998743057250977, 10.646883010864258, 12.295023918151855, 13.943163871765137, 15.591303825378418, 17.239444732666016, 18.887584686279297, 20.535724639892578, 22.18386459350586, 23.83200454711914, 25.480144500732422, 27.128284454345703, 28.776424407958984, 30.4245662689209, 32.07270812988281, 33.720848083496094, 35.368988037109375, 37.017127990722656, 38.66526794433594, 40.31340789794922, 41.9615478515625, 43.60968780517578, 45.25782775878906, 46.905967712402344]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 7.0, 8.0, 6.0, 8.0, 12.0, 11.0, 13.0, 20.0, 26.0, 22.0, 21.0, 26.0, 30.0, 31.0, 34.0, 20.0, 29.0, 38.0, 38.0, 32.0, 40.0, 46.0, 39.0, 33.0, 36.0, 34.0, 28.0, 39.0, 38.0, 23.0, 28.0, 21.0, 24.0, 18.0, 14.0, 15.0, 13.0, 16.0, 11.0, 11.0, 7.0, 6.0, 7.0, 5.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.7578125, -6.5355224609375, -6.313232421875, -6.0909423828125, -5.86865234375, -5.6463623046875, -5.424072265625, -5.2017822265625, -4.9794921875, -4.7572021484375, -4.534912109375, -4.3126220703125, -4.09033203125, -3.8680419921875, -3.645751953125, -3.4234619140625, -3.201171875, -2.9788818359375, -2.756591796875, -2.5343017578125, -2.31201171875, -2.0897216796875, -1.867431640625, -1.6451416015625, -1.4228515625, -1.2005615234375, -0.978271484375, -0.7559814453125, -0.53369140625, -0.3114013671875, -0.089111328125, 0.1331787109375, 0.35546875, 0.5777587890625, 0.800048828125, 1.0223388671875, 1.24462890625, 1.4669189453125, 1.689208984375, 1.9114990234375, 2.1337890625, 2.3560791015625, 2.578369140625, 2.8006591796875, 3.02294921875, 3.2452392578125, 3.467529296875, 3.6898193359375, 3.912109375, 4.1343994140625, 4.356689453125, 4.5789794921875, 4.80126953125, 5.0235595703125, 5.245849609375, 5.4681396484375, 5.6904296875, 5.9127197265625, 6.135009765625, 6.3572998046875, 6.57958984375, 6.8018798828125, 7.024169921875, 7.2464599609375, 7.46875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 9.0, 6.0, 15.0, 17.0, 24.0, 28.0, 25.0, 57.0, 73.0, 91.0, 135.0, 182.0, 276.0, 428.0, 696.0, 1214.0, 2447.0, 5449.0, 16746.0, 79677.0, 576468.0, 2175978.0, 1130890.0, 159325.0, 28361.0, 8315.0, 3280.0, 1594.0, 845.0, 504.0, 327.0, 222.0, 129.0, 114.0, 87.0, 61.0, 34.0, 35.0, 29.0, 19.0, 22.0, 9.0, 6.0, 10.0, 5.0, 5.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-14.1953125, -13.77392578125, -13.3525390625, -12.93115234375, -12.509765625, -12.08837890625, -11.6669921875, -11.24560546875, -10.82421875, -10.40283203125, -9.9814453125, -9.56005859375, -9.138671875, -8.71728515625, -8.2958984375, -7.87451171875, -7.453125, -7.03173828125, -6.6103515625, -6.18896484375, -5.767578125, -5.34619140625, -4.9248046875, -4.50341796875, -4.08203125, -3.66064453125, -3.2392578125, -2.81787109375, -2.396484375, -1.97509765625, -1.5537109375, -1.13232421875, -0.7109375, -0.28955078125, 0.1318359375, 0.55322265625, 0.974609375, 1.39599609375, 1.8173828125, 2.23876953125, 2.66015625, 3.08154296875, 3.5029296875, 3.92431640625, 4.345703125, 4.76708984375, 5.1884765625, 5.60986328125, 6.03125, 6.45263671875, 6.8740234375, 7.29541015625, 7.716796875, 8.13818359375, 8.5595703125, 8.98095703125, 9.40234375, 9.82373046875, 10.2451171875, 10.66650390625, 11.087890625, 11.50927734375, 11.9306640625, 12.35205078125, 12.7734375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 8.0, 5.0, 23.0, 22.0, 47.0, 62.0, 92.0, 138.0, 188.0, 300.0, 434.0, 525.0, 589.0, 465.0, 367.0, 262.0, 160.0, 94.0, 69.0, 54.0, 46.0, 43.0, 16.0, 9.0, 11.0, 7.0, 5.0, 11.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.59375, -16.1220703125, -15.650390625, -15.1787109375, -14.70703125, -14.2353515625, -13.763671875, -13.2919921875, -12.8203125, -12.3486328125, -11.876953125, -11.4052734375, -10.93359375, -10.4619140625, -9.990234375, -9.5185546875, -9.046875, -8.5751953125, -8.103515625, -7.6318359375, -7.16015625, -6.6884765625, -6.216796875, -5.7451171875, -5.2734375, -4.8017578125, -4.330078125, -3.8583984375, -3.38671875, -2.9150390625, -2.443359375, -1.9716796875, -1.5, -1.0283203125, -0.556640625, -0.0849609375, 0.38671875, 0.8583984375, 1.330078125, 1.8017578125, 2.2734375, 2.7451171875, 3.216796875, 3.6884765625, 4.16015625, 4.6318359375, 5.103515625, 5.5751953125, 6.046875, 6.5185546875, 6.990234375, 7.4619140625, 7.93359375, 8.4052734375, 8.876953125, 9.3486328125, 9.8203125, 10.2919921875, 10.763671875, 11.2353515625, 11.70703125, 12.1787109375, 12.650390625, 13.1220703125, 13.59375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 8.0, 11.0, 5.0, 8.0, 14.0, 15.0, 20.0, 31.0, 42.0, 50.0, 104.0, 132.0, 204.0, 355.0, 822.0, 2317.0, 12765.0, 290510.0, 3752640.0, 122810.0, 8224.0, 1714.0, 668.0, 310.0, 191.0, 113.0, 70.0, 32.0, 38.0, 19.0, 16.0, 11.0, 9.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.875, -44.541015625, -43.20703125, -41.873046875, -40.5390625, -39.205078125, -37.87109375, -36.537109375, -35.203125, -33.869140625, -32.53515625, -31.201171875, -29.8671875, -28.533203125, -27.19921875, -25.865234375, -24.53125, -23.197265625, -21.86328125, -20.529296875, -19.1953125, -17.861328125, -16.52734375, -15.193359375, -13.859375, -12.525390625, -11.19140625, -9.857421875, -8.5234375, -7.189453125, -5.85546875, -4.521484375, -3.1875, -1.853515625, -0.51953125, 0.814453125, 2.1484375, 3.482421875, 4.81640625, 6.150390625, 7.484375, 8.818359375, 10.15234375, 11.486328125, 12.8203125, 14.154296875, 15.48828125, 16.822265625, 18.15625, 19.490234375, 20.82421875, 22.158203125, 23.4921875, 24.826171875, 26.16015625, 27.494140625, 28.828125, 30.162109375, 31.49609375, 32.830078125, 34.1640625, 35.498046875, 36.83203125, 38.166015625, 39.5]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 15.0, 716.0, 286.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-367.4073181152344, -350.5296630859375, -333.6520080566406, -316.77435302734375, -299.8966979980469, -283.01904296875, -266.141357421875, -249.2637176513672, -232.3860626220703, -215.50840759277344, -198.63075256347656, -181.75308227539062, -164.87542724609375, -147.99777221679688, -131.1201171875, -114.24246215820312, -97.36480712890625, -80.48715209960938, -63.609493255615234, -46.731834411621094, -29.85417938232422, -12.976524353027344, 3.9011383056640625, 20.778793334960938, 37.65644836425781, 54.53410339355469, 71.41175842285156, 88.28942108154297, 105.16707611083984, 122.04473114013672, 138.92239379882812, 155.800048828125, 172.67767333984375, 189.55532836914062, 206.4329833984375, 223.31063842773438, 240.18829345703125, 257.0659484863281, 273.943603515625, 290.8212890625, 307.69891357421875, 324.5765686035156, 341.4542236328125, 358.3318786621094, 375.20953369140625, 392.0871887207031, 408.96484375, 425.842529296875, 442.7201843261719, 459.59783935546875, 476.4754943847656, 493.3531494140625, 510.2308044433594, 527.1084594726562, 543.9861450195312, 560.86376953125, 577.741455078125, 594.619140625, 611.4967651367188, 628.3744506835938, 645.2520751953125, 662.1297607421875, 679.0073852539062, 695.8850708007812, 712.7626953125]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 7.0, 8.0, 5.0, 8.0, 8.0, 14.0, 20.0, 12.0, 17.0, 20.0, 24.0, 29.0, 30.0, 34.0, 47.0, 34.0, 34.0, 30.0, 32.0, 50.0, 38.0, 34.0, 44.0, 45.0, 34.0, 44.0, 39.0, 33.0, 29.0, 31.0, 29.0, 26.0, 17.0, 22.0, 9.0, 8.0, 10.0, 7.0, 9.0, 11.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.06842041015625, -38.75014114379883, -37.431861877441406, -36.113582611083984, -34.79530334472656, -33.47702407836914, -32.15874481201172, -30.840465545654297, -29.522186279296875, -28.203907012939453, -26.88562774658203, -25.56734848022461, -24.249069213867188, -22.930789947509766, -21.612510681152344, -20.294231414794922, -18.9759521484375, -17.657672882080078, -16.339393615722656, -15.021114349365234, -13.702835083007812, -12.38455581665039, -11.066276550292969, -9.747997283935547, -8.429718017578125, -7.111438751220703, -5.793159484863281, -4.474880218505859, -3.1566009521484375, -1.8383216857910156, -0.5200424194335938, 0.7982368469238281, 2.11651611328125, 3.434795379638672, 4.753074645996094, 6.071353912353516, 7.3896331787109375, 8.70791244506836, 10.026191711425781, 11.344470977783203, 12.662750244140625, 13.981029510498047, 15.299308776855469, 16.61758804321289, 17.935867309570312, 19.254146575927734, 20.572425842285156, 21.890705108642578, 23.208984375, 24.527263641357422, 25.845542907714844, 27.163822174072266, 28.482101440429688, 29.80038070678711, 31.11865997314453, 32.43693923950195, 33.755218505859375, 35.0734977722168, 36.39177703857422, 37.71005630493164, 39.02833557128906, 40.346614837646484, 41.664894104003906, 42.98317337036133, 44.30145263671875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 6.0, 8.0, 10.0, 7.0, 9.0, 13.0, 24.0, 21.0, 30.0, 20.0, 21.0, 35.0, 33.0, 20.0, 28.0, 37.0, 33.0, 40.0, 31.0, 38.0, 44.0, 52.0, 34.0, 35.0, 41.0, 36.0, 26.0, 29.0, 32.0, 32.0, 26.0, 17.0, 22.0, 12.0, 13.0, 13.0, 17.0, 6.0, 9.0, 8.0, 0.0, 8.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-7.98828125, -7.74749755859375, -7.5067138671875, -7.26593017578125, -7.025146484375, -6.78436279296875, -6.5435791015625, -6.30279541015625, -6.06201171875, -5.82122802734375, -5.5804443359375, -5.33966064453125, -5.098876953125, -4.85809326171875, -4.6173095703125, -4.37652587890625, -4.1357421875, -3.89495849609375, -3.6541748046875, -3.41339111328125, -3.172607421875, -2.93182373046875, -2.6910400390625, -2.45025634765625, -2.20947265625, -1.96868896484375, -1.7279052734375, -1.48712158203125, -1.246337890625, -1.00555419921875, -0.7647705078125, -0.52398681640625, -0.283203125, -0.04241943359375, 0.1983642578125, 0.43914794921875, 0.679931640625, 0.92071533203125, 1.1614990234375, 1.40228271484375, 1.64306640625, 1.88385009765625, 2.1246337890625, 2.36541748046875, 2.606201171875, 2.84698486328125, 3.0877685546875, 3.32855224609375, 3.5693359375, 3.81011962890625, 4.0509033203125, 4.29168701171875, 4.532470703125, 4.77325439453125, 5.0140380859375, 5.25482177734375, 5.49560546875, 5.73638916015625, 5.9771728515625, 6.21795654296875, 6.458740234375, 6.69952392578125, 6.9403076171875, 7.18109130859375, 7.421875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 8.0, 13.0, 11.0, 25.0, 35.0, 55.0, 87.0, 112.0, 173.0, 273.0, 388.0, 578.0, 807.0, 1263.0, 1872.0, 2897.0, 4359.0, 6648.0, 10513.0, 16537.0, 27490.0, 45789.0, 77779.0, 125617.0, 180698.0, 187633.0, 138032.0, 86117.0, 51082.0, 30249.0, 18225.0, 11575.0, 7461.0, 4786.0, 3103.0, 2069.0, 1436.0, 905.0, 598.0, 422.0, 270.0, 185.0, 126.0, 102.0, 53.0, 34.0, 23.0, 16.0, 12.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 4.0], "bins": [-0.78369140625, -0.7600173950195312, -0.7363433837890625, -0.7126693725585938, -0.688995361328125, -0.6653213500976562, -0.6416473388671875, -0.6179733276367188, -0.59429931640625, -0.5706253051757812, -0.5469512939453125, -0.5232772827148438, -0.499603271484375, -0.47592926025390625, -0.4522552490234375, -0.42858123779296875, -0.4049072265625, -0.38123321533203125, -0.3575592041015625, -0.33388519287109375, -0.310211181640625, -0.28653717041015625, -0.2628631591796875, -0.23918914794921875, -0.21551513671875, -0.19184112548828125, -0.1681671142578125, -0.14449310302734375, -0.120819091796875, -0.09714508056640625, -0.0734710693359375, -0.04979705810546875, -0.026123046875, -0.00244903564453125, 0.0212249755859375, 0.04489898681640625, 0.068572998046875, 0.09224700927734375, 0.1159210205078125, 0.13959503173828125, 0.16326904296875, 0.18694305419921875, 0.2106170654296875, 0.23429107666015625, 0.257965087890625, 0.28163909912109375, 0.3053131103515625, 0.32898712158203125, 0.3526611328125, 0.37633514404296875, 0.4000091552734375, 0.42368316650390625, 0.447357177734375, 0.47103118896484375, 0.4947052001953125, 0.5183792114257812, 0.54205322265625, 0.5657272338867188, 0.5894012451171875, 0.6130752563476562, 0.636749267578125, 0.6604232788085938, 0.6840972900390625, 0.7077713012695312, 0.7314453125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 2.0, 8.0, 9.0, 4.0, 6.0, 12.0, 15.0, 13.0, 17.0, 19.0, 18.0, 22.0, 29.0, 37.0, 27.0, 37.0, 35.0, 36.0, 34.0, 32.0, 27.0, 30.0, 1058.0, 48.0, 45.0, 43.0, 29.0, 31.0, 32.0, 22.0, 25.0, 22.0, 39.0, 12.0, 20.0, 16.0, 16.0, 13.0, 16.0, 10.0, 14.0, 12.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.09765625, -4.94769287109375, -4.7977294921875, -4.64776611328125, -4.497802734375, -4.34783935546875, -4.1978759765625, -4.04791259765625, -3.89794921875, -3.74798583984375, -3.5980224609375, -3.44805908203125, -3.298095703125, -3.14813232421875, -2.9981689453125, -2.84820556640625, -2.6982421875, -2.54827880859375, -2.3983154296875, -2.24835205078125, -2.098388671875, -1.94842529296875, -1.7984619140625, -1.64849853515625, -1.49853515625, -1.34857177734375, -1.1986083984375, -1.04864501953125, -0.898681640625, -0.74871826171875, -0.5987548828125, -0.44879150390625, -0.298828125, -0.14886474609375, 0.0010986328125, 0.15106201171875, 0.301025390625, 0.45098876953125, 0.6009521484375, 0.75091552734375, 0.90087890625, 1.05084228515625, 1.2008056640625, 1.35076904296875, 1.500732421875, 1.65069580078125, 1.8006591796875, 1.95062255859375, 2.1005859375, 2.25054931640625, 2.4005126953125, 2.55047607421875, 2.700439453125, 2.85040283203125, 3.0003662109375, 3.15032958984375, 3.30029296875, 3.45025634765625, 3.6002197265625, 3.75018310546875, 3.900146484375, 4.05010986328125, 4.2000732421875, 4.35003662109375, 4.5]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 10.0, 14.0, 20.0, 37.0, 49.0, 76.0, 140.0, 241.0, 399.0, 676.0, 1133.0, 2069.0, 3348.0, 6072.0, 10639.0, 18910.0, 34426.0, 62684.0, 114473.0, 185902.0, 1267125.0, 168168.0, 99536.0, 54339.0, 29228.0, 15987.0, 9276.0, 5073.0, 3015.0, 1668.0, 983.0, 542.0, 336.0, 195.0, 135.0, 79.0, 44.0, 29.0, 15.0, 14.0, 13.0, 4.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64697265625, -0.6224441528320312, -0.5979156494140625, -0.5733871459960938, -0.548858642578125, -0.5243301391601562, -0.4998016357421875, -0.47527313232421875, -0.45074462890625, -0.42621612548828125, -0.4016876220703125, -0.37715911865234375, -0.352630615234375, -0.32810211181640625, -0.3035736083984375, -0.27904510498046875, -0.2545166015625, -0.22998809814453125, -0.2054595947265625, -0.18093109130859375, -0.156402587890625, -0.13187408447265625, -0.1073455810546875, -0.08281707763671875, -0.05828857421875, -0.03376007080078125, -0.0092315673828125, 0.01529693603515625, 0.039825439453125, 0.06435394287109375, 0.0888824462890625, 0.11341094970703125, 0.137939453125, 0.16246795654296875, 0.1869964599609375, 0.21152496337890625, 0.236053466796875, 0.26058197021484375, 0.2851104736328125, 0.30963897705078125, 0.33416748046875, 0.35869598388671875, 0.3832244873046875, 0.40775299072265625, 0.432281494140625, 0.45680999755859375, 0.4813385009765625, 0.5058670043945312, 0.5303955078125, 0.5549240112304688, 0.5794525146484375, 0.6039810180664062, 0.628509521484375, 0.6530380249023438, 0.6775665283203125, 0.7020950317382812, 0.72662353515625, 0.7511520385742188, 0.7756805419921875, 0.8002090454101562, 0.824737548828125, 0.8492660522460938, 0.8737945556640625, 0.8983230590820312, 0.9228515625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 0.0, 4.0, 7.0, 4.0, 3.0, 8.0, 10.0, 13.0, 22.0, 12.0, 21.0, 26.0, 25.0, 31.0, 51.0, 43.0, 34.0, 52.0, 58.0, 64.0, 51.0, 56.0, 53.0, 48.0, 44.0, 52.0, 30.0, 28.0, 28.0, 22.0, 18.0, 17.0, 13.0, 12.0, 11.0, 8.0, 10.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0026569366455078125, -0.0025802552700042725, -0.0025035738945007324, -0.0024268925189971924, -0.0023502111434936523, -0.0022735297679901123, -0.0021968483924865723, -0.0021201670169830322, -0.002043485641479492, -0.001966804265975952, -0.0018901228904724121, -0.001813441514968872, -0.001736760139465332, -0.001660078763961792, -0.001583397388458252, -0.001506716012954712, -0.0014300346374511719, -0.0013533532619476318, -0.0012766718864440918, -0.0011999905109405518, -0.0011233091354370117, -0.0010466277599334717, -0.0009699463844299316, -0.0008932650089263916, -0.0008165836334228516, -0.0007399022579193115, -0.0006632208824157715, -0.0005865395069122314, -0.0005098581314086914, -0.00043317675590515137, -0.00035649538040161133, -0.0002798140048980713, -0.00020313262939453125, -0.0001264512538909912, -4.976987838745117e-05, 2.6911497116088867e-05, 0.0001035928726196289, 0.00018027424812316895, 0.000256955623626709, 0.000333636999130249, 0.00041031837463378906, 0.0004869997501373291, 0.0005636811256408691, 0.0006403625011444092, 0.0007170438766479492, 0.0007937252521514893, 0.0008704066276550293, 0.0009470880031585693, 0.0010237693786621094, 0.0011004507541656494, 0.0011771321296691895, 0.0012538135051727295, 0.0013304948806762695, 0.0014071762561798096, 0.0014838576316833496, 0.0015605390071868896, 0.0016372203826904297, 0.0017139017581939697, 0.0017905831336975098, 0.0018672645092010498, 0.0019439458847045898, 0.00202062726020813, 0.00209730863571167, 0.00217399001121521, 0.00225067138671875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 4.0, 5.0, 12.0, 17.0, 22.0, 20.0, 30.0, 51.0, 59.0, 61.0, 79.0, 123.0, 207.0, 364.0, 721.0, 13790.0, 1022870.0, 8244.0, 686.0, 406.0, 192.0, 140.0, 94.0, 83.0, 61.0, 38.0, 37.0, 31.0, 19.0, 16.0, 15.0, 10.0, 9.0, 3.0, 7.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04779052734375, -0.04616832733154297, -0.04454612731933594, -0.042923927307128906, -0.041301727294921875, -0.039679527282714844, -0.03805732727050781, -0.03643512725830078, -0.03481292724609375, -0.03319072723388672, -0.03156852722167969, -0.029946327209472656, -0.028324127197265625, -0.026701927185058594, -0.025079727172851562, -0.02345752716064453, -0.0218353271484375, -0.02021312713623047, -0.018590927124023438, -0.016968727111816406, -0.015346527099609375, -0.013724327087402344, -0.012102127075195312, -0.010479927062988281, -0.00885772705078125, -0.007235527038574219, -0.0056133270263671875, -0.003991127014160156, -0.002368927001953125, -0.0007467269897460938, 0.0008754730224609375, 0.0024976730346679688, 0.004119873046875, 0.005742073059082031, 0.0073642730712890625, 0.008986473083496094, 0.010608673095703125, 0.012230873107910156, 0.013853073120117188, 0.015475273132324219, 0.01709747314453125, 0.01871967315673828, 0.020341873168945312, 0.021964073181152344, 0.023586273193359375, 0.025208473205566406, 0.026830673217773438, 0.02845287322998047, 0.0300750732421875, 0.03169727325439453, 0.03331947326660156, 0.034941673278808594, 0.036563873291015625, 0.038186073303222656, 0.03980827331542969, 0.04143047332763672, 0.04305267333984375, 0.04467487335205078, 0.04629707336425781, 0.047919273376464844, 0.049541473388671875, 0.051163673400878906, 0.05278587341308594, 0.05440807342529297, 0.0560302734375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 384.0, 629.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03326241672039032, -0.032689839601516724, -0.03211726248264313, -0.03154468536376953, -0.030972106382250786, -0.03039952926337719, -0.029826950281858444, -0.029254373162984848, -0.028681796044111252, -0.028109218925237656, -0.02753664180636406, -0.026964062824845314, -0.026391485705971718, -0.02581890858709812, -0.025246329605579376, -0.02467375248670578, -0.024101175367832184, -0.023528598248958588, -0.02295602113008499, -0.022383442148566246, -0.02181086502969265, -0.021238287910819054, -0.020665708929300308, -0.020093131810426712, -0.019520554691553116, -0.01894797757267952, -0.018375400453805923, -0.017802821472287178, -0.017230244353413582, -0.016657667234539986, -0.01608508825302124, -0.015512511134147644, -0.014939934015274048, -0.014367356896400452, -0.01379477884620428, -0.01322220079600811, -0.012649623677134514, -0.012077046558260918, -0.011504468508064747, -0.010931890457868576, -0.01035931333899498, -0.009786736220121384, -0.009214158169925213, -0.008641580119729042, -0.008069003000855446, -0.007496425416320562, -0.006923847831785679, -0.006351270247250795, -0.005778692662715912, -0.005206115078181028, -0.004633537493646145, -0.004060959909111261, -0.003488382324576378, -0.0029158047400414944, -0.002343227155506611, -0.0017706495709717274, -0.0011980719864368439, -0.0006254944019019604, -5.2916817367076874e-05, 0.0005196607671678066, 0.0010922383517026901, 0.0016648159362375736, 0.002237393520772457, 0.0028099711053073406, 0.003382548689842224]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 4.0, 2.0, 4.0, 12.0, 9.0, 15.0, 9.0, 19.0, 14.0, 27.0, 24.0, 23.0, 26.0, 26.0, 37.0, 28.0, 42.0, 32.0, 36.0, 51.0, 32.0, 31.0, 34.0, 34.0, 43.0, 31.0, 46.0, 34.0, 32.0, 39.0, 25.0, 24.0, 25.0, 22.0, 14.0, 11.0, 20.0, 13.0, 9.0, 3.0, 4.0, 4.0, 4.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0011951327323913574, -0.0011548642069101334, -0.0011145956814289093, -0.0010743271559476852, -0.0010340586304664612, -0.0009937901049852371, -0.0009535215795040131, -0.000913253054022789, -0.0008729845285415649, -0.0008327160030603409, -0.0007924474775791168, -0.0007521789520978928, -0.0007119104266166687, -0.0006716419011354446, -0.0006313733756542206, -0.0005911048501729965, -0.0005508363246917725, -0.0005105677992105484, -0.00047029927372932434, -0.0004300307482481003, -0.0003897622227668762, -0.00034949369728565216, -0.0003092251718044281, -0.00026895664632320404, -0.00022868812084197998, -0.00018841959536075592, -0.00014815106987953186, -0.0001078825443983078, -6.761401891708374e-05, -2.734549343585968e-05, 1.292303204536438e-05, 5.319155752658844e-05, 9.34600830078125e-05, 0.00013372860848903656, 0.00017399713397026062, 0.00021426565945148468, 0.00025453418493270874, 0.0002948027104139328, 0.00033507123589515686, 0.0003753397613763809, 0.000415608286857605, 0.00045587681233882904, 0.0004961453378200531, 0.0005364138633012772, 0.0005766823887825012, 0.0006169509142637253, 0.0006572194397449493, 0.0006974879652261734, 0.0007377564907073975, 0.0007780250161886215, 0.0008182935416698456, 0.0008585620671510696, 0.0008988305926322937, 0.0009390991181135178, 0.0009793676435947418, 0.0010196361690759659, 0.00105990469455719, 0.001100173220038414, 0.001140441745519638, 0.0011807102710008621, 0.0012209787964820862, 0.0012612473219633102, 0.0013015158474445343, 0.0013417843729257584, 0.0013820528984069824]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 6.0, 8.0, 10.0, 7.0, 9.0, 13.0, 24.0, 21.0, 30.0, 20.0, 21.0, 35.0, 33.0, 20.0, 28.0, 37.0, 33.0, 40.0, 31.0, 38.0, 44.0, 52.0, 34.0, 35.0, 41.0, 36.0, 26.0, 29.0, 32.0, 32.0, 26.0, 17.0, 22.0, 12.0, 13.0, 13.0, 17.0, 6.0, 9.0, 8.0, 0.0, 8.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-7.98828125, -7.74749755859375, -7.5067138671875, -7.26593017578125, -7.025146484375, -6.78436279296875, -6.5435791015625, -6.30279541015625, -6.06201171875, -5.82122802734375, -5.5804443359375, -5.33966064453125, -5.098876953125, -4.85809326171875, -4.6173095703125, -4.37652587890625, -4.1357421875, -3.89495849609375, -3.6541748046875, -3.41339111328125, -3.172607421875, -2.93182373046875, -2.6910400390625, -2.45025634765625, -2.20947265625, -1.96868896484375, -1.7279052734375, -1.48712158203125, -1.246337890625, -1.00555419921875, -0.7647705078125, -0.52398681640625, -0.283203125, -0.04241943359375, 0.1983642578125, 0.43914794921875, 0.679931640625, 0.92071533203125, 1.1614990234375, 1.40228271484375, 1.64306640625, 1.88385009765625, 2.1246337890625, 2.36541748046875, 2.606201171875, 2.84698486328125, 3.0877685546875, 3.32855224609375, 3.5693359375, 3.81011962890625, 4.0509033203125, 4.29168701171875, 4.532470703125, 4.77325439453125, 5.0140380859375, 5.25482177734375, 5.49560546875, 5.73638916015625, 5.9771728515625, 6.21795654296875, 6.458740234375, 6.69952392578125, 6.9403076171875, 7.18109130859375, 7.421875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 10.0, 17.0, 21.0, 24.0, 27.0, 33.0, 48.0, 74.0, 63.0, 111.0, 139.0, 211.0, 332.0, 493.0, 843.0, 1348.0, 2466.0, 4636.0, 9339.0, 20285.0, 50197.0, 149602.0, 449801.0, 233637.0, 71506.0, 27493.0, 12309.0, 5860.0, 3127.0, 1719.0, 962.0, 597.0, 333.0, 265.0, 149.0, 127.0, 83.0, 65.0, 43.0, 36.0, 30.0, 23.0, 16.0, 13.0, 10.0, 12.0, 6.0, 8.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-10.0, -9.6939697265625, -9.387939453125, -9.0819091796875, -8.77587890625, -8.4698486328125, -8.163818359375, -7.8577880859375, -7.5517578125, -7.2457275390625, -6.939697265625, -6.6336669921875, -6.32763671875, -6.0216064453125, -5.715576171875, -5.4095458984375, -5.103515625, -4.7974853515625, -4.491455078125, -4.1854248046875, -3.87939453125, -3.5733642578125, -3.267333984375, -2.9613037109375, -2.6552734375, -2.3492431640625, -2.043212890625, -1.7371826171875, -1.43115234375, -1.1251220703125, -0.819091796875, -0.5130615234375, -0.20703125, 0.0989990234375, 0.405029296875, 0.7110595703125, 1.01708984375, 1.3231201171875, 1.629150390625, 1.9351806640625, 2.2412109375, 2.5472412109375, 2.853271484375, 3.1593017578125, 3.46533203125, 3.7713623046875, 4.077392578125, 4.3834228515625, 4.689453125, 4.9954833984375, 5.301513671875, 5.6075439453125, 5.91357421875, 6.2196044921875, 6.525634765625, 6.8316650390625, 7.1376953125, 7.4437255859375, 7.749755859375, 8.0557861328125, 8.36181640625, 8.6678466796875, 8.973876953125, 9.2799072265625, 9.5859375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 2.0, 6.0, 9.0, 7.0, 9.0, 12.0, 9.0, 14.0, 19.0, 9.0, 21.0, 21.0, 27.0, 25.0, 31.0, 30.0, 32.0, 31.0, 50.0, 60.0, 95.0, 129.0, 1395.0, 350.0, 137.0, 83.0, 63.0, 36.0, 50.0, 39.0, 34.0, 26.0, 34.0, 26.0, 15.0, 18.0, 15.0, 14.0, 13.0, 9.0, 8.0, 10.0, 6.0, 3.0, 5.0, 1.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0], "bins": [-23.625, -22.949951171875, -22.27490234375, -21.599853515625, -20.9248046875, -20.249755859375, -19.57470703125, -18.899658203125, -18.224609375, -17.549560546875, -16.87451171875, -16.199462890625, -15.5244140625, -14.849365234375, -14.17431640625, -13.499267578125, -12.82421875, -12.149169921875, -11.47412109375, -10.799072265625, -10.1240234375, -9.448974609375, -8.77392578125, -8.098876953125, -7.423828125, -6.748779296875, -6.07373046875, -5.398681640625, -4.7236328125, -4.048583984375, -3.37353515625, -2.698486328125, -2.0234375, -1.348388671875, -0.67333984375, 0.001708984375, 0.6767578125, 1.351806640625, 2.02685546875, 2.701904296875, 3.376953125, 4.052001953125, 4.72705078125, 5.402099609375, 6.0771484375, 6.752197265625, 7.42724609375, 8.102294921875, 8.77734375, 9.452392578125, 10.12744140625, 10.802490234375, 11.4775390625, 12.152587890625, 12.82763671875, 13.502685546875, 14.177734375, 14.852783203125, 15.52783203125, 16.202880859375, 16.8779296875, 17.552978515625, 18.22802734375, 18.903076171875, 19.578125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 11.0, 18.0, 18.0, 22.0, 26.0, 41.0, 64.0, 73.0, 112.0, 130.0, 187.0, 335.0, 663.0, 2539.0, 29079.0, 2437870.0, 655548.0, 15727.0, 1681.0, 533.0, 278.0, 220.0, 134.0, 81.0, 78.0, 60.0, 31.0, 31.0, 19.0, 22.0, 11.0, 9.0, 13.0, 9.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.5517578125, -31.384765625, -30.2177734375, -29.05078125, -27.8837890625, -26.716796875, -25.5498046875, -24.3828125, -23.2158203125, -22.048828125, -20.8818359375, -19.71484375, -18.5478515625, -17.380859375, -16.2138671875, -15.046875, -13.8798828125, -12.712890625, -11.5458984375, -10.37890625, -9.2119140625, -8.044921875, -6.8779296875, -5.7109375, -4.5439453125, -3.376953125, -2.2099609375, -1.04296875, 0.1240234375, 1.291015625, 2.4580078125, 3.625, 4.7919921875, 5.958984375, 7.1259765625, 8.29296875, 9.4599609375, 10.626953125, 11.7939453125, 12.9609375, 14.1279296875, 15.294921875, 16.4619140625, 17.62890625, 18.7958984375, 19.962890625, 21.1298828125, 22.296875, 23.4638671875, 24.630859375, 25.7978515625, 26.96484375, 28.1318359375, 29.298828125, 30.4658203125, 31.6328125, 32.7998046875, 33.966796875, 35.1337890625, 36.30078125, 37.4677734375, 38.634765625, 39.8017578125, 40.96875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 35.0, 796.0, 183.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.10650634765625, -46.885040283203125, -38.663578033447266, -30.442113876342773, -22.22064971923828, -13.999183654785156, -5.777721405029297, 2.4437408447265625, 10.665206909179688, 18.88667106628418, 27.108135223388672, 35.32959747314453, 43.551063537597656, 51.77252960205078, 59.99399185180664, 68.2154541015625, 76.43692016601562, 84.65838623046875, 92.87985229492188, 101.10131072998047, 109.3227767944336, 117.54424285888672, 125.76570129394531, 133.98716735839844, 142.20863342285156, 150.4300994873047, 158.6515655517578, 166.87303161621094, 175.094482421875, 183.31594848632812, 191.53741455078125, 199.75888061523438, 207.98031616210938, 216.2017822265625, 224.42324829101562, 232.64471435546875, 240.86618041992188, 249.087646484375, 257.3091125488281, 265.53057861328125, 273.75201416015625, 281.9734802246094, 290.1949462890625, 298.4164123535156, 306.63787841796875, 314.8593444824219, 323.080810546875, 331.30224609375, 339.52374267578125, 347.7452087402344, 355.9666748046875, 364.1881408691406, 372.40960693359375, 380.6310729980469, 388.8525390625, 397.073974609375, 405.29547119140625, 413.5169372558594, 421.7384033203125, 429.9598693847656, 438.18133544921875, 446.4028015136719, 454.624267578125, 462.845703125, 471.0671691894531]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 1.0, 6.0, 9.0, 8.0, 7.0, 9.0, 16.0, 22.0, 11.0, 21.0, 20.0, 29.0, 26.0, 31.0, 35.0, 44.0, 37.0, 35.0, 49.0, 52.0, 44.0, 39.0, 52.0, 41.0, 40.0, 39.0, 33.0, 30.0, 29.0, 33.0, 22.0, 19.0, 20.0, 15.0, 14.0, 12.0, 8.0, 9.0, 9.0, 6.0, 5.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.40476608276367, -55.64702224731445, -53.88927459716797, -52.13153076171875, -50.373783111572266, -48.61603927612305, -46.85829162597656, -45.100547790527344, -43.342803955078125, -41.585060119628906, -39.82731246948242, -38.0695686340332, -36.31182098388672, -34.5540771484375, -32.79633331298828, -31.038585662841797, -29.280838012695312, -27.52309226989746, -25.76534652709961, -24.00760269165039, -22.249855041503906, -20.492111206054688, -18.734365463256836, -16.976619720458984, -15.218873977661133, -13.461128234863281, -11.70338249206543, -9.945637702941895, -8.187891960144043, -6.430146217346191, -4.672401428222656, -2.9146556854248047, -1.1569061279296875, 0.600839376449585, 2.3585848808288574, 4.116330146789551, 5.874075889587402, 7.631821632385254, 9.389566421508789, 11.14731216430664, 12.905057907104492, 14.662803649902344, 16.420549392700195, 18.178295135498047, 19.936038970947266, 21.69378662109375, 23.45153045654297, 25.20927619934082, 26.967021942138672, 28.724767684936523, 30.482513427734375, 32.240257263183594, 33.99800491333008, 35.7557487487793, 37.51349639892578, 39.271240234375, 41.02898406982422, 42.78672790527344, 44.54447555541992, 46.30221939086914, 48.059967041015625, 49.817710876464844, 51.57545471191406, 53.33320236206055, 55.09095001220703]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 4.0, 3.0, 12.0, 9.0, 21.0, 17.0, 19.0, 22.0, 25.0, 29.0, 23.0, 25.0, 33.0, 28.0, 46.0, 38.0, 41.0, 43.0, 43.0, 40.0, 47.0, 44.0, 44.0, 32.0, 27.0, 38.0, 37.0, 28.0, 26.0, 21.0, 33.0, 15.0, 22.0, 16.0, 13.0, 7.0, 6.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2109375, -8.9339599609375, -8.656982421875, -8.3800048828125, -8.10302734375, -7.8260498046875, -7.549072265625, -7.2720947265625, -6.9951171875, -6.7181396484375, -6.441162109375, -6.1641845703125, -5.88720703125, -5.6102294921875, -5.333251953125, -5.0562744140625, -4.779296875, -4.5023193359375, -4.225341796875, -3.9483642578125, -3.67138671875, -3.3944091796875, -3.117431640625, -2.8404541015625, -2.5634765625, -2.2864990234375, -2.009521484375, -1.7325439453125, -1.45556640625, -1.1785888671875, -0.901611328125, -0.6246337890625, -0.34765625, -0.0706787109375, 0.206298828125, 0.4832763671875, 0.76025390625, 1.0372314453125, 1.314208984375, 1.5911865234375, 1.8681640625, 2.1451416015625, 2.422119140625, 2.6990966796875, 2.97607421875, 3.2530517578125, 3.530029296875, 3.8070068359375, 4.083984375, 4.3609619140625, 4.637939453125, 4.9149169921875, 5.19189453125, 5.4688720703125, 5.745849609375, 6.0228271484375, 6.2998046875, 6.5767822265625, 6.853759765625, 7.1307373046875, 7.40771484375, 7.6846923828125, 7.961669921875, 8.2386474609375, 8.515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 11.0, 6.0, 10.0, 8.0, 13.0, 11.0, 20.0, 12.0, 32.0, 43.0, 57.0, 106.0, 182.0, 334.0, 834.0, 2442.0, 9080.0, 54723.0, 568365.0, 2512924.0, 937964.0, 88965.0, 12972.0, 3087.0, 1043.0, 459.0, 197.0, 125.0, 60.0, 44.0, 32.0, 13.0, 8.0, 11.0, 15.0, 17.0, 11.0, 13.0, 5.0, 7.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.515625, -15.0087890625, -14.501953125, -13.9951171875, -13.48828125, -12.9814453125, -12.474609375, -11.9677734375, -11.4609375, -10.9541015625, -10.447265625, -9.9404296875, -9.43359375, -8.9267578125, -8.419921875, -7.9130859375, -7.40625, -6.8994140625, -6.392578125, -5.8857421875, -5.37890625, -4.8720703125, -4.365234375, -3.8583984375, -3.3515625, -2.8447265625, -2.337890625, -1.8310546875, -1.32421875, -0.8173828125, -0.310546875, 0.1962890625, 0.703125, 1.2099609375, 1.716796875, 2.2236328125, 2.73046875, 3.2373046875, 3.744140625, 4.2509765625, 4.7578125, 5.2646484375, 5.771484375, 6.2783203125, 6.78515625, 7.2919921875, 7.798828125, 8.3056640625, 8.8125, 9.3193359375, 9.826171875, 10.3330078125, 10.83984375, 11.3466796875, 11.853515625, 12.3603515625, 12.8671875, 13.3740234375, 13.880859375, 14.3876953125, 14.89453125, 15.4013671875, 15.908203125, 16.4150390625, 16.921875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 9.0, 10.0, 16.0, 16.0, 20.0, 33.0, 49.0, 64.0, 82.0, 119.0, 189.0, 310.0, 443.0, 542.0, 541.0, 484.0, 382.0, 236.0, 163.0, 105.0, 72.0, 48.0, 29.0, 25.0, 16.0, 15.0, 11.0, 7.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.953125, -15.5233154296875, -15.093505859375, -14.6636962890625, -14.23388671875, -13.8040771484375, -13.374267578125, -12.9444580078125, -12.5146484375, -12.0848388671875, -11.655029296875, -11.2252197265625, -10.79541015625, -10.3656005859375, -9.935791015625, -9.5059814453125, -9.076171875, -8.6463623046875, -8.216552734375, -7.7867431640625, -7.35693359375, -6.9271240234375, -6.497314453125, -6.0675048828125, -5.6376953125, -5.2078857421875, -4.778076171875, -4.3482666015625, -3.91845703125, -3.4886474609375, -3.058837890625, -2.6290283203125, -2.19921875, -1.7694091796875, -1.339599609375, -0.9097900390625, -0.47998046875, -0.0501708984375, 0.379638671875, 0.8094482421875, 1.2392578125, 1.6690673828125, 2.098876953125, 2.5286865234375, 2.95849609375, 3.3883056640625, 3.818115234375, 4.2479248046875, 4.677734375, 5.1075439453125, 5.537353515625, 5.9671630859375, 6.39697265625, 6.8267822265625, 7.256591796875, 7.6864013671875, 8.1162109375, 8.5460205078125, 8.975830078125, 9.4056396484375, 9.83544921875, 10.2652587890625, 10.695068359375, 11.1248779296875, 11.5546875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 4.0, 16.0, 24.0, 25.0, 37.0, 36.0, 77.0, 101.0, 189.0, 306.0, 592.0, 1266.0, 3140.0, 10246.0, 48035.0, 394895.0, 3131243.0, 528243.0, 58070.0, 11436.0, 3513.0, 1290.0, 606.0, 326.0, 158.0, 127.0, 73.0, 60.0, 39.0, 20.0, 18.0, 21.0, 11.0, 6.0, 6.0, 9.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-24.0, -23.324951171875, -22.64990234375, -21.974853515625, -21.2998046875, -20.624755859375, -19.94970703125, -19.274658203125, -18.599609375, -17.924560546875, -17.24951171875, -16.574462890625, -15.8994140625, -15.224365234375, -14.54931640625, -13.874267578125, -13.19921875, -12.524169921875, -11.84912109375, -11.174072265625, -10.4990234375, -9.823974609375, -9.14892578125, -8.473876953125, -7.798828125, -7.123779296875, -6.44873046875, -5.773681640625, -5.0986328125, -4.423583984375, -3.74853515625, -3.073486328125, -2.3984375, -1.723388671875, -1.04833984375, -0.373291015625, 0.3017578125, 0.976806640625, 1.65185546875, 2.326904296875, 3.001953125, 3.677001953125, 4.35205078125, 5.027099609375, 5.7021484375, 6.377197265625, 7.05224609375, 7.727294921875, 8.40234375, 9.077392578125, 9.75244140625, 10.427490234375, 11.1025390625, 11.777587890625, 12.45263671875, 13.127685546875, 13.802734375, 14.477783203125, 15.15283203125, 15.827880859375, 16.5029296875, 17.177978515625, 17.85302734375, 18.528076171875, 19.203125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 14.0, 148.0, 535.0, 279.0, 35.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-416.5489807128906, -409.1947021484375, -401.84039306640625, -394.4861145019531, -387.1318359375, -379.7775573730469, -372.4232482910156, -365.0689697265625, -357.7146911621094, -350.36041259765625, -343.006103515625, -335.6518249511719, -328.29754638671875, -320.9432678222656, -313.5889587402344, -306.23468017578125, -298.8804016113281, -291.526123046875, -284.17181396484375, -276.8175354003906, -269.4632568359375, -262.1089782714844, -254.7546844482422, -247.400390625, -240.0460968017578, -232.69180297851562, -225.3375244140625, -217.9832305908203, -210.6289520263672, -203.274658203125, -195.92037963867188, -188.5660858154297, -181.21182250976562, -173.85752868652344, -166.5032501220703, -159.14895629882812, -151.794677734375, -144.4403839111328, -137.0861053466797, -129.7318115234375, -122.37751770019531, -115.02323150634766, -107.6689453125, -100.31465911865234, -92.96037292480469, -85.6060791015625, -78.25180053710938, -70.89750671386719, -63.54322814941406, -56.188941955566406, -48.83465576171875, -41.480369567871094, -34.12608337402344, -26.771793365478516, -19.41750717163086, -12.063220977783203, -4.708934783935547, 2.6453518867492676, 9.999638557434082, 17.353925704956055, 24.70821189880371, 32.0625, 39.416786193847656, 46.77107238769531, 54.12535858154297]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 6.0, 5.0, 8.0, 7.0, 8.0, 9.0, 18.0, 13.0, 14.0, 19.0, 22.0, 20.0, 29.0, 18.0, 22.0, 32.0, 29.0, 23.0, 40.0, 33.0, 27.0, 39.0, 44.0, 31.0, 38.0, 33.0, 37.0, 33.0, 31.0, 31.0, 34.0, 29.0, 27.0, 22.0, 10.0, 13.0, 25.0, 17.0, 10.0, 15.0, 17.0, 6.0, 10.0, 10.0, 10.0, 6.0, 6.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0], "bins": [-40.50442886352539, -39.3116340637207, -38.118839263916016, -36.92604446411133, -35.733253479003906, -34.54045867919922, -33.34766387939453, -32.154869079589844, -30.962074279785156, -29.76927947998047, -28.57648468017578, -27.383691787719727, -26.19089698791504, -24.99810218811035, -23.805309295654297, -22.61251449584961, -21.419719696044922, -20.226924896240234, -19.034130096435547, -17.841337203979492, -16.648542404174805, -15.455747604370117, -14.262953758239746, -13.070159912109375, -11.877365112304688, -10.6845703125, -9.491776466369629, -8.298982620239258, -7.10618782043457, -5.913393497467041, -4.720599174499512, -3.5278053283691406, -2.3350067138671875, -1.1422123908996582, 0.050581932067871094, 1.2433762550354004, 2.4361705780029297, 3.628964900970459, 4.821759223937988, 6.014553070068359, 7.207347869873047, 8.400142669677734, 9.592936515808105, 10.785730361938477, 11.978525161743164, 13.171319961547852, 14.364113807678223, 15.556907653808594, 16.74970245361328, 17.94249725341797, 19.135292053222656, 20.32808494567871, 21.5208797454834, 22.713674545288086, 23.90646743774414, 25.099262237548828, 26.292057037353516, 27.484851837158203, 28.67764663696289, 29.870439529418945, 31.063234329223633, 32.25602722167969, 33.448822021484375, 34.64161682128906, 35.83441162109375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 7.0, 10.0, 23.0, 18.0, 15.0, 30.0, 27.0, 23.0, 30.0, 28.0, 38.0, 42.0, 44.0, 44.0, 36.0, 49.0, 47.0, 43.0, 36.0, 42.0, 45.0, 33.0, 31.0, 29.0, 27.0, 19.0, 19.0, 15.0, 19.0, 25.0, 21.0, 9.0, 11.0, 7.0, 5.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84375, -7.566162109375, -7.28857421875, -7.010986328125, -6.7333984375, -6.455810546875, -6.17822265625, -5.900634765625, -5.623046875, -5.345458984375, -5.06787109375, -4.790283203125, -4.5126953125, -4.235107421875, -3.95751953125, -3.679931640625, -3.40234375, -3.124755859375, -2.84716796875, -2.569580078125, -2.2919921875, -2.014404296875, -1.73681640625, -1.459228515625, -1.181640625, -0.904052734375, -0.62646484375, -0.348876953125, -0.0712890625, 0.206298828125, 0.48388671875, 0.761474609375, 1.0390625, 1.316650390625, 1.59423828125, 1.871826171875, 2.1494140625, 2.427001953125, 2.70458984375, 2.982177734375, 3.259765625, 3.537353515625, 3.81494140625, 4.092529296875, 4.3701171875, 4.647705078125, 4.92529296875, 5.202880859375, 5.48046875, 5.758056640625, 6.03564453125, 6.313232421875, 6.5908203125, 6.868408203125, 7.14599609375, 7.423583984375, 7.701171875, 7.978759765625, 8.25634765625, 8.533935546875, 8.8115234375, 9.089111328125, 9.36669921875, 9.644287109375, 9.921875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 9.0, 16.0, 24.0, 34.0, 46.0, 81.0, 94.0, 144.0, 253.0, 378.0, 598.0, 887.0, 1258.0, 2032.0, 2954.0, 4723.0, 7385.0, 12134.0, 19599.0, 32958.0, 56667.0, 97436.0, 157743.0, 206309.0, 173490.0, 110339.0, 64559.0, 37459.0, 22044.0, 13378.0, 8400.0, 5302.0, 3348.0, 2209.0, 1472.0, 927.0, 657.0, 436.0, 261.0, 158.0, 111.0, 84.0, 46.0, 35.0, 25.0, 10.0, 13.0, 14.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.78369140625, -0.757232666015625, -0.73077392578125, -0.704315185546875, -0.6778564453125, -0.651397705078125, -0.62493896484375, -0.598480224609375, -0.572021484375, -0.545562744140625, -0.51910400390625, -0.492645263671875, -0.4661865234375, -0.439727783203125, -0.41326904296875, -0.386810302734375, -0.3603515625, -0.333892822265625, -0.30743408203125, -0.280975341796875, -0.2545166015625, -0.228057861328125, -0.20159912109375, -0.175140380859375, -0.148681640625, -0.122222900390625, -0.09576416015625, -0.069305419921875, -0.0428466796875, -0.016387939453125, 0.01007080078125, 0.036529541015625, 0.06298828125, 0.089447021484375, 0.11590576171875, 0.142364501953125, 0.1688232421875, 0.195281982421875, 0.22174072265625, 0.248199462890625, 0.274658203125, 0.301116943359375, 0.32757568359375, 0.354034423828125, 0.3804931640625, 0.406951904296875, 0.43341064453125, 0.459869384765625, 0.486328125, 0.512786865234375, 0.53924560546875, 0.565704345703125, 0.5921630859375, 0.618621826171875, 0.64508056640625, 0.671539306640625, 0.697998046875, 0.724456787109375, 0.75091552734375, 0.777374267578125, 0.8038330078125, 0.830291748046875, 0.85675048828125, 0.883209228515625, 0.90966796875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 6.0, 7.0, 18.0, 12.0, 9.0, 19.0, 17.0, 17.0, 24.0, 25.0, 35.0, 29.0, 41.0, 33.0, 46.0, 46.0, 56.0, 32.0, 1072.0, 35.0, 39.0, 46.0, 46.0, 34.0, 29.0, 36.0, 36.0, 33.0, 27.0, 20.0, 23.0, 10.0, 11.0, 5.0, 6.0, 6.0, 4.0, 4.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-6.69140625, -6.50347900390625, -6.3155517578125, -6.12762451171875, -5.939697265625, -5.75177001953125, -5.5638427734375, -5.37591552734375, -5.18798828125, -5.00006103515625, -4.8121337890625, -4.62420654296875, -4.436279296875, -4.24835205078125, -4.0604248046875, -3.87249755859375, -3.6845703125, -3.49664306640625, -3.3087158203125, -3.12078857421875, -2.932861328125, -2.74493408203125, -2.5570068359375, -2.36907958984375, -2.18115234375, -1.99322509765625, -1.8052978515625, -1.61737060546875, -1.429443359375, -1.24151611328125, -1.0535888671875, -0.86566162109375, -0.677734375, -0.48980712890625, -0.3018798828125, -0.11395263671875, 0.073974609375, 0.26190185546875, 0.4498291015625, 0.63775634765625, 0.82568359375, 1.01361083984375, 1.2015380859375, 1.38946533203125, 1.577392578125, 1.76531982421875, 1.9532470703125, 2.14117431640625, 2.3291015625, 2.51702880859375, 2.7049560546875, 2.89288330078125, 3.080810546875, 3.26873779296875, 3.4566650390625, 3.64459228515625, 3.83251953125, 4.02044677734375, 4.2083740234375, 4.39630126953125, 4.584228515625, 4.77215576171875, 4.9600830078125, 5.14801025390625, 5.3359375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 13.0, 16.0, 38.0, 51.0, 57.0, 94.0, 124.0, 238.0, 356.0, 578.0, 903.0, 1482.0, 2397.0, 3818.0, 6278.0, 10220.0, 17161.0, 28718.0, 49309.0, 82967.0, 132525.0, 219667.0, 1187876.0, 138006.0, 87300.0, 51636.0, 29875.0, 17840.0, 10750.0, 6457.0, 3956.0, 2364.0, 1463.0, 873.0, 614.0, 409.0, 260.0, 158.0, 100.0, 48.0, 48.0, 31.0, 16.0, 13.0, 10.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.634765625, -0.6136398315429688, -0.5925140380859375, -0.5713882446289062, -0.550262451171875, -0.5291366577148438, -0.5080108642578125, -0.48688507080078125, -0.46575927734375, -0.44463348388671875, -0.4235076904296875, -0.40238189697265625, -0.381256103515625, -0.36013031005859375, -0.3390045166015625, -0.31787872314453125, -0.2967529296875, -0.27562713623046875, -0.2545013427734375, -0.23337554931640625, -0.212249755859375, -0.19112396240234375, -0.1699981689453125, -0.14887237548828125, -0.12774658203125, -0.10662078857421875, -0.0854949951171875, -0.06436920166015625, -0.043243408203125, -0.02211761474609375, -0.0009918212890625, 0.02013397216796875, 0.041259765625, 0.06238555908203125, 0.0835113525390625, 0.10463714599609375, 0.125762939453125, 0.14688873291015625, 0.1680145263671875, 0.18914031982421875, 0.21026611328125, 0.23139190673828125, 0.2525177001953125, 0.27364349365234375, 0.294769287109375, 0.31589508056640625, 0.3370208740234375, 0.35814666748046875, 0.3792724609375, 0.40039825439453125, 0.4215240478515625, 0.44264984130859375, 0.463775634765625, 0.48490142822265625, 0.5060272216796875, 0.5271530151367188, 0.54827880859375, 0.5694046020507812, 0.5905303955078125, 0.6116561889648438, 0.632781982421875, 0.6539077758789062, 0.6750335693359375, 0.6961593627929688, 0.71728515625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 9.0, 9.0, 11.0, 14.0, 21.0, 18.0, 22.0, 32.0, 43.0, 38.0, 47.0, 53.0, 54.0, 56.0, 54.0, 66.0, 58.0, 42.0, 42.0, 57.0, 40.0, 30.0, 27.0, 24.0, 23.0, 21.0, 16.0, 18.0, 6.0, 4.0, 6.0, 6.0, 5.0, 6.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0026988983154296875, -0.0026188790798187256, -0.0025388598442077637, -0.0024588406085968018, -0.00237882137298584, -0.002298802137374878, -0.002218782901763916, -0.002138763666152954, -0.002058744430541992, -0.0019787251949310303, -0.0018987059593200684, -0.0018186867237091064, -0.0017386674880981445, -0.0016586482524871826, -0.0015786290168762207, -0.0014986097812652588, -0.0014185905456542969, -0.001338571310043335, -0.001258552074432373, -0.0011785328388214111, -0.0010985136032104492, -0.0010184943675994873, -0.0009384751319885254, -0.0008584558963775635, -0.0007784366607666016, -0.0006984174251556396, -0.0006183981895446777, -0.0005383789539337158, -0.0004583597183227539, -0.000378340482711792, -0.0002983212471008301, -0.00021830201148986816, -0.00013828277587890625, -5.8263540267944336e-05, 2.1755695343017578e-05, 0.00010177493095397949, 0.0001817941665649414, 0.0002618134021759033, 0.00034183263778686523, 0.00042185187339782715, 0.0005018711090087891, 0.000581890344619751, 0.0006619095802307129, 0.0007419288158416748, 0.0008219480514526367, 0.0009019672870635986, 0.0009819865226745605, 0.0010620057582855225, 0.0011420249938964844, 0.0012220442295074463, 0.0013020634651184082, 0.0013820827007293701, 0.001462101936340332, 0.001542121171951294, 0.0016221404075622559, 0.0017021596431732178, 0.0017821788787841797, 0.0018621981143951416, 0.0019422173500061035, 0.0020222365856170654, 0.0021022558212280273, 0.0021822750568389893, 0.002262294292449951, 0.002342313528060913, 0.002422332763671875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 9.0, 5.0, 6.0, 14.0, 11.0, 11.0, 12.0, 22.0, 21.0, 26.0, 34.0, 38.0, 52.0, 72.0, 77.0, 130.0, 168.0, 233.0, 465.0, 1179.0, 88304.0, 951278.0, 4715.0, 625.0, 336.0, 172.0, 134.0, 85.0, 86.0, 55.0, 33.0, 34.0, 23.0, 22.0, 20.0, 13.0, 11.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044952392578125, -0.043415069580078125, -0.04187774658203125, -0.040340423583984375, -0.0388031005859375, -0.037265777587890625, -0.03572845458984375, -0.034191131591796875, -0.03265380859375, -0.031116485595703125, -0.02957916259765625, -0.028041839599609375, -0.0265045166015625, -0.024967193603515625, -0.02342987060546875, -0.021892547607421875, -0.020355224609375, -0.018817901611328125, -0.01728057861328125, -0.015743255615234375, -0.0142059326171875, -0.012668609619140625, -0.01113128662109375, -0.009593963623046875, -0.008056640625, -0.006519317626953125, -0.00498199462890625, -0.003444671630859375, -0.0019073486328125, -0.000370025634765625, 0.00116729736328125, 0.002704620361328125, 0.004241943359375, 0.005779266357421875, 0.00731658935546875, 0.008853912353515625, 0.0103912353515625, 0.011928558349609375, 0.01346588134765625, 0.015003204345703125, 0.01654052734375, 0.018077850341796875, 0.01961517333984375, 0.021152496337890625, 0.0226898193359375, 0.024227142333984375, 0.02576446533203125, 0.027301788330078125, 0.028839111328125, 0.030376434326171875, 0.03191375732421875, 0.033451080322265625, 0.0349884033203125, 0.036525726318359375, 0.03806304931640625, 0.039600372314453125, 0.0411376953125, 0.042675018310546875, 0.04421234130859375, 0.045749664306640625, 0.0472869873046875, 0.048824310302734375, 0.05036163330078125, 0.051898956298828125, 0.053436279296875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 434.0, 582.0], "bins": [-0.04661134257912636, -0.04587218165397644, -0.04513302072882652, -0.044393859803676605, -0.04365469887852669, -0.04291553795337677, -0.04217637702822685, -0.041437216103076935, -0.04069805517792702, -0.0399588942527771, -0.03921973332762718, -0.038480572402477264, -0.03774141147732735, -0.03700225055217743, -0.03626308962702751, -0.035523928701877594, -0.034784767776727676, -0.03404560685157776, -0.03330644592642784, -0.032567285001277924, -0.031828124076128006, -0.03108896315097809, -0.03034980222582817, -0.029610641300678253, -0.028871482238173485, -0.028132321313023567, -0.02739316038787365, -0.026653999462723732, -0.025914838537573814, -0.025175677612423897, -0.02443651668727398, -0.02369735576212406, -0.022958194836974144, -0.022219033911824226, -0.02147987298667431, -0.02074071206152439, -0.020001551136374474, -0.019262390211224556, -0.01852322928607464, -0.01778406836092472, -0.017044909298419952, -0.016305748373270035, -0.015566587448120117, -0.0148274265229702, -0.014088265597820282, -0.013349104672670364, -0.012609943747520447, -0.01187078282237053, -0.011131621897220612, -0.010392460972070694, -0.009653300046920776, -0.008914139121770859, -0.008174978196620941, -0.0074358172714710236, -0.006696656811982393, -0.005957495886832476, -0.005218334496021271, -0.004479173570871353, -0.0037400126457214355, -0.0030008519534021616, -0.002261691028252244, -0.0015225301031023264, -0.0007833694107830524, -4.420848563313484e-05, 0.0006949523231014609]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 8.0, 13.0, 11.0, 20.0, 19.0, 22.0, 35.0, 36.0, 34.0, 43.0, 44.0, 55.0, 59.0, 52.0, 55.0, 61.0, 53.0, 50.0, 62.0, 38.0, 39.0, 45.0, 27.0, 38.0, 16.0, 18.0, 7.0, 6.0, 14.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015953779220581055, -0.0015363981947302818, -0.0014774184674024582, -0.0014184387400746346, -0.001359459012746811, -0.0013004792854189873, -0.0012414995580911636, -0.00118251983076334, -0.0011235401034355164, -0.0010645603761076927, -0.001005580648779869, -0.0009466009214520454, -0.0008876211941242218, -0.0008286414667963982, -0.0007696617394685745, -0.0007106820121407509, -0.0006517022848129272, -0.0005927225574851036, -0.00053374283015728, -0.00047476310282945633, -0.0004157833755016327, -0.00035680364817380905, -0.0002978239208459854, -0.00023884419351816177, -0.00017986446619033813, -0.0001208847388625145, -6.190501153469086e-05, -2.925284206867218e-06, 5.605444312095642e-05, 0.00011503417044878006, 0.0001740138977766037, 0.00023299362510442734, 0.000291973352432251, 0.0003509530797600746, 0.00040993280708789825, 0.0004689125344157219, 0.0005278922617435455, 0.0005868719890713692, 0.0006458517163991928, 0.0007048314437270164, 0.0007638111710548401, 0.0008227908983826637, 0.0008817706257104874, 0.000940750353038311, 0.0009997300803661346, 0.0010587098076939583, 0.001117689535021782, 0.0011766692623496056, 0.0012356489896774292, 0.0012946287170052528, 0.0013536084443330765, 0.0014125881716609001, 0.0014715678989887238, 0.0015305476263165474, 0.001589527353644371, 0.0016485070809721947, 0.0017074868083000183, 0.001766466535627842, 0.0018254462629556656, 0.0018844259902834892, 0.0019434057176113129, 0.0020023854449391365, 0.00206136517226696, 0.0021203448995947838, 0.0021793246269226074]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 7.0, 11.0, 22.0, 18.0, 16.0, 29.0, 27.0, 23.0, 31.0, 28.0, 37.0, 42.0, 44.0, 44.0, 36.0, 51.0, 45.0, 43.0, 36.0, 42.0, 45.0, 33.0, 31.0, 29.0, 27.0, 19.0, 19.0, 15.0, 19.0, 25.0, 21.0, 9.0, 11.0, 7.0, 5.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.83984375, -7.56231689453125, -7.2847900390625, -7.00726318359375, -6.729736328125, -6.45220947265625, -6.1746826171875, -5.89715576171875, -5.61962890625, -5.34210205078125, -5.0645751953125, -4.78704833984375, -4.509521484375, -4.23199462890625, -3.9544677734375, -3.67694091796875, -3.3994140625, -3.12188720703125, -2.8443603515625, -2.56683349609375, -2.289306640625, -2.01177978515625, -1.7342529296875, -1.45672607421875, -1.17919921875, -0.90167236328125, -0.6241455078125, -0.34661865234375, -0.069091796875, 0.20843505859375, 0.4859619140625, 0.76348876953125, 1.041015625, 1.31854248046875, 1.5960693359375, 1.87359619140625, 2.151123046875, 2.42864990234375, 2.7061767578125, 2.98370361328125, 3.26123046875, 3.53875732421875, 3.8162841796875, 4.09381103515625, 4.371337890625, 4.64886474609375, 4.9263916015625, 5.20391845703125, 5.4814453125, 5.75897216796875, 6.0364990234375, 6.31402587890625, 6.591552734375, 6.86907958984375, 7.1466064453125, 7.42413330078125, 7.70166015625, 7.97918701171875, 8.2567138671875, 8.53424072265625, 8.811767578125, 9.08929443359375, 9.3668212890625, 9.64434814453125, 9.921875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 6.0, 7.0, 12.0, 12.0, 12.0, 13.0, 33.0, 48.0, 57.0, 76.0, 81.0, 130.0, 210.0, 271.0, 421.0, 692.0, 1219.0, 2407.0, 4815.0, 9886.0, 22445.0, 56483.0, 174371.0, 461528.0, 202373.0, 63764.0, 25030.0, 10966.0, 5005.0, 2619.0, 1402.0, 730.0, 457.0, 258.0, 208.0, 113.0, 101.0, 66.0, 63.0, 40.0, 26.0, 34.0, 26.0, 12.0, 6.0, 3.0, 4.0, 6.0, 4.0, 5.0, 1.0, 1.0], "bins": [-12.0625, -11.7232666015625, -11.384033203125, -11.0447998046875, -10.70556640625, -10.3663330078125, -10.027099609375, -9.6878662109375, -9.3486328125, -9.0093994140625, -8.670166015625, -8.3309326171875, -7.99169921875, -7.6524658203125, -7.313232421875, -6.9739990234375, -6.634765625, -6.2955322265625, -5.956298828125, -5.6170654296875, -5.27783203125, -4.9385986328125, -4.599365234375, -4.2601318359375, -3.9208984375, -3.5816650390625, -3.242431640625, -2.9031982421875, -2.56396484375, -2.2247314453125, -1.885498046875, -1.5462646484375, -1.20703125, -0.8677978515625, -0.528564453125, -0.1893310546875, 0.14990234375, 0.4891357421875, 0.828369140625, 1.1676025390625, 1.5068359375, 1.8460693359375, 2.185302734375, 2.5245361328125, 2.86376953125, 3.2030029296875, 3.542236328125, 3.8814697265625, 4.220703125, 4.5599365234375, 4.899169921875, 5.2384033203125, 5.57763671875, 5.9168701171875, 6.256103515625, 6.5953369140625, 6.9345703125, 7.2738037109375, 7.613037109375, 7.9522705078125, 8.29150390625, 8.6307373046875, 8.969970703125, 9.3092041015625, 9.6484375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 1.0, 9.0, 5.0, 2.0, 8.0, 13.0, 15.0, 11.0, 18.0, 18.0, 30.0, 21.0, 32.0, 38.0, 38.0, 43.0, 45.0, 57.0, 100.0, 199.0, 1441.0, 312.0, 135.0, 67.0, 63.0, 48.0, 32.0, 39.0, 35.0, 29.0, 21.0, 19.0, 18.0, 14.0, 18.0, 10.0, 10.0, 11.0, 5.0, 8.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.515625, -24.7607421875, -24.005859375, -23.2509765625, -22.49609375, -21.7412109375, -20.986328125, -20.2314453125, -19.4765625, -18.7216796875, -17.966796875, -17.2119140625, -16.45703125, -15.7021484375, -14.947265625, -14.1923828125, -13.4375, -12.6826171875, -11.927734375, -11.1728515625, -10.41796875, -9.6630859375, -8.908203125, -8.1533203125, -7.3984375, -6.6435546875, -5.888671875, -5.1337890625, -4.37890625, -3.6240234375, -2.869140625, -2.1142578125, -1.359375, -0.6044921875, 0.150390625, 0.9052734375, 1.66015625, 2.4150390625, 3.169921875, 3.9248046875, 4.6796875, 5.4345703125, 6.189453125, 6.9443359375, 7.69921875, 8.4541015625, 9.208984375, 9.9638671875, 10.71875, 11.4736328125, 12.228515625, 12.9833984375, 13.73828125, 14.4931640625, 15.248046875, 16.0029296875, 16.7578125, 17.5126953125, 18.267578125, 19.0224609375, 19.77734375, 20.5322265625, 21.287109375, 22.0419921875, 22.796875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 5.0, 6.0, 11.0, 15.0, 18.0, 18.0, 24.0, 37.0, 40.0, 65.0, 79.0, 108.0, 165.0, 241.0, 469.0, 1397.0, 13736.0, 2174485.0, 942061.0, 10293.0, 1154.0, 431.0, 262.0, 144.0, 131.0, 61.0, 56.0, 41.0, 39.0, 28.0, 21.0, 17.0, 8.0, 13.0, 5.0, 7.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.6875, -40.24755859375, -38.8076171875, -37.36767578125, -35.927734375, -34.48779296875, -33.0478515625, -31.60791015625, -30.16796875, -28.72802734375, -27.2880859375, -25.84814453125, -24.408203125, -22.96826171875, -21.5283203125, -20.08837890625, -18.6484375, -17.20849609375, -15.7685546875, -14.32861328125, -12.888671875, -11.44873046875, -10.0087890625, -8.56884765625, -7.12890625, -5.68896484375, -4.2490234375, -2.80908203125, -1.369140625, 0.07080078125, 1.5107421875, 2.95068359375, 4.390625, 5.83056640625, 7.2705078125, 8.71044921875, 10.150390625, 11.59033203125, 13.0302734375, 14.47021484375, 15.91015625, 17.35009765625, 18.7900390625, 20.22998046875, 21.669921875, 23.10986328125, 24.5498046875, 25.98974609375, 27.4296875, 28.86962890625, 30.3095703125, 31.74951171875, 33.189453125, 34.62939453125, 36.0693359375, 37.50927734375, 38.94921875, 40.38916015625, 41.8291015625, 43.26904296875, 44.708984375, 46.14892578125, 47.5888671875, 49.02880859375, 50.46875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 167.0, 832.0, 17.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-475.1203308105469, -465.277587890625, -455.434814453125, -445.5920715332031, -435.74932861328125, -425.90655517578125, -416.0638122558594, -406.2210693359375, -396.3782958984375, -386.5355529785156, -376.6927795410156, -366.85003662109375, -357.0072937011719, -347.16455078125, -337.32177734375, -327.4790344238281, -317.63629150390625, -307.7935485839844, -297.9507751464844, -288.1080322265625, -278.2652893066406, -268.42254638671875, -258.57977294921875, -248.73703002929688, -238.89427185058594, -229.051513671875, -219.20877075195312, -209.3660125732422, -199.52325439453125, -189.68051147460938, -179.83775329589844, -169.9949951171875, -160.1522216796875, -150.30946350097656, -140.4667205810547, -130.62396240234375, -120.78121185302734, -110.93846130371094, -101.095703125, -91.2529525756836, -81.41020202636719, -71.56745147705078, -61.72469711303711, -51.88194274902344, -42.03919219970703, -32.196441650390625, -22.353687286376953, -12.510932922363281, -2.668182373046875, 7.174570083618164, 17.017322540283203, 26.860074996948242, 36.70282745361328, 46.54557800292969, 56.38833236694336, 66.23108673095703, 76.07383728027344, 85.91658782958984, 95.75933837890625, 105.60209655761719, 115.4448471069336, 125.28759765625, 135.13035583496094, 144.97311401367188, 154.81585693359375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 8.0, 5.0, 5.0, 6.0, 15.0, 17.0, 13.0, 19.0, 16.0, 20.0, 30.0, 24.0, 30.0, 26.0, 40.0, 30.0, 41.0, 37.0, 30.0, 40.0, 52.0, 36.0, 44.0, 29.0, 28.0, 45.0, 30.0, 35.0, 32.0, 29.0, 37.0, 14.0, 18.0, 23.0, 18.0, 14.0, 8.0, 12.0, 11.0, 3.0, 12.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 4.0, 0.0, 2.0], "bins": [-61.60636901855469, -59.895355224609375, -58.1843376159668, -56.473323822021484, -54.762306213378906, -53.051292419433594, -51.34027862548828, -49.6292610168457, -47.918243408203125, -46.20722961425781, -44.496212005615234, -42.78519821166992, -41.074180603027344, -39.36316680908203, -37.65215301513672, -35.94113540649414, -34.23012161254883, -32.519107818603516, -30.808090209960938, -29.097076416015625, -27.386058807373047, -25.675045013427734, -23.96402931213379, -22.253013610839844, -20.5419979095459, -18.830982208251953, -17.119966506958008, -15.408951759338379, -13.697936058044434, -11.986920356750488, -10.27590560913086, -8.564889907836914, -6.853874206542969, -5.142858505249023, -3.4318432807922363, -1.7208280563354492, -0.009812355041503906, 1.7012033462524414, 3.4122180938720703, 5.123233795166016, 6.834249496459961, 8.545265197753906, 10.256280899047852, 11.96729564666748, 13.678311347961426, 15.389327049255371, 17.100341796875, 18.811357498168945, 20.52237319946289, 22.233388900756836, 23.94440460205078, 25.655418395996094, 27.366436004638672, 29.077449798583984, 30.78846549987793, 32.499481201171875, 34.21049499511719, 35.9215087890625, 37.63252639770508, 39.34354019165039, 41.05455780029297, 42.76557159423828, 44.476585388183594, 46.18760299682617, 47.89862060546875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 8.0, 9.0, 8.0, 16.0, 21.0, 21.0, 16.0, 25.0, 29.0, 24.0, 27.0, 40.0, 34.0, 37.0, 50.0, 34.0, 49.0, 48.0, 44.0, 45.0, 43.0, 31.0, 42.0, 34.0, 24.0, 24.0, 31.0, 23.0, 19.0, 20.0, 14.0, 19.0, 9.0, 16.0, 17.0, 11.0, 11.0, 5.0, 5.0, 8.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.0703125, -7.784423828125, -7.49853515625, -7.212646484375, -6.9267578125, -6.640869140625, -6.35498046875, -6.069091796875, -5.783203125, -5.497314453125, -5.21142578125, -4.925537109375, -4.6396484375, -4.353759765625, -4.06787109375, -3.781982421875, -3.49609375, -3.210205078125, -2.92431640625, -2.638427734375, -2.3525390625, -2.066650390625, -1.78076171875, -1.494873046875, -1.208984375, -0.923095703125, -0.63720703125, -0.351318359375, -0.0654296875, 0.220458984375, 0.50634765625, 0.792236328125, 1.078125, 1.364013671875, 1.64990234375, 1.935791015625, 2.2216796875, 2.507568359375, 2.79345703125, 3.079345703125, 3.365234375, 3.651123046875, 3.93701171875, 4.222900390625, 4.5087890625, 4.794677734375, 5.08056640625, 5.366455078125, 5.65234375, 5.938232421875, 6.22412109375, 6.510009765625, 6.7958984375, 7.081787109375, 7.36767578125, 7.653564453125, 7.939453125, 8.225341796875, 8.51123046875, 8.797119140625, 9.0830078125, 9.368896484375, 9.65478515625, 9.940673828125, 10.2265625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 9.0, 11.0, 15.0, 8.0, 17.0, 15.0, 30.0, 31.0, 52.0, 49.0, 71.0, 95.0, 133.0, 167.0, 256.0, 320.0, 445.0, 1289.0, 4151022.0, 38082.0, 617.0, 411.0, 267.0, 201.0, 179.0, 109.0, 90.0, 62.0, 48.0, 37.0, 21.0, 20.0, 19.0, 21.0, 9.0, 18.0, 5.0, 6.0, 6.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-140.625, -136.19921875, -131.7734375, -127.34765625, -122.921875, -118.49609375, -114.0703125, -109.64453125, -105.21875, -100.79296875, -96.3671875, -91.94140625, -87.515625, -83.08984375, -78.6640625, -74.23828125, -69.8125, -65.38671875, -60.9609375, -56.53515625, -52.109375, -47.68359375, -43.2578125, -38.83203125, -34.40625, -29.98046875, -25.5546875, -21.12890625, -16.703125, -12.27734375, -7.8515625, -3.42578125, 1.0, 5.42578125, 9.8515625, 14.27734375, 18.703125, 23.12890625, 27.5546875, 31.98046875, 36.40625, 40.83203125, 45.2578125, 49.68359375, 54.109375, 58.53515625, 62.9609375, 67.38671875, 71.8125, 76.23828125, 80.6640625, 85.08984375, 89.515625, 93.94140625, 98.3671875, 102.79296875, 107.21875, 111.64453125, 116.0703125, 120.49609375, 124.921875, 129.34765625, 133.7734375, 138.19921875, 142.625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 7.0, 4.0, 7.0, 11.0, 13.0, 25.0, 32.0, 36.0, 77.0, 92.0, 158.0, 229.0, 434.0, 698.0, 814.0, 594.0, 354.0, 183.0, 101.0, 70.0, 44.0, 26.0, 19.0, 22.0, 13.0, 2.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.234375, -22.6427001953125, -22.051025390625, -21.4593505859375, -20.86767578125, -20.2760009765625, -19.684326171875, -19.0926513671875, -18.5009765625, -17.9093017578125, -17.317626953125, -16.7259521484375, -16.13427734375, -15.5426025390625, -14.950927734375, -14.3592529296875, -13.767578125, -13.1759033203125, -12.584228515625, -11.9925537109375, -11.40087890625, -10.8092041015625, -10.217529296875, -9.6258544921875, -9.0341796875, -8.4425048828125, -7.850830078125, -7.2591552734375, -6.66748046875, -6.0758056640625, -5.484130859375, -4.8924560546875, -4.30078125, -3.7091064453125, -3.117431640625, -2.5257568359375, -1.93408203125, -1.3424072265625, -0.750732421875, -0.1590576171875, 0.4326171875, 1.0242919921875, 1.615966796875, 2.2076416015625, 2.79931640625, 3.3909912109375, 3.982666015625, 4.5743408203125, 5.166015625, 5.7576904296875, 6.349365234375, 6.9410400390625, 7.53271484375, 8.1243896484375, 8.716064453125, 9.3077392578125, 9.8994140625, 10.4910888671875, 11.082763671875, 11.6744384765625, 12.26611328125, 12.8577880859375, 13.449462890625, 14.0411376953125, 14.6328125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 9.0, 6.0, 5.0, 11.0, 7.0, 21.0, 28.0, 27.0, 35.0, 39.0, 58.0, 61.0, 147.0, 440.0, 4962.0, 3408358.0, 776647.0, 2627.0, 341.0, 120.0, 70.0, 51.0, 30.0, 32.0, 29.0, 26.0, 23.0, 22.0, 13.0, 9.0, 5.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.0, -71.5263671875, -69.052734375, -66.5791015625, -64.10546875, -61.6318359375, -59.158203125, -56.6845703125, -54.2109375, -51.7373046875, -49.263671875, -46.7900390625, -44.31640625, -41.8427734375, -39.369140625, -36.8955078125, -34.421875, -31.9482421875, -29.474609375, -27.0009765625, -24.52734375, -22.0537109375, -19.580078125, -17.1064453125, -14.6328125, -12.1591796875, -9.685546875, -7.2119140625, -4.73828125, -2.2646484375, 0.208984375, 2.6826171875, 5.15625, 7.6298828125, 10.103515625, 12.5771484375, 15.05078125, 17.5244140625, 19.998046875, 22.4716796875, 24.9453125, 27.4189453125, 29.892578125, 32.3662109375, 34.83984375, 37.3134765625, 39.787109375, 42.2607421875, 44.734375, 47.2080078125, 49.681640625, 52.1552734375, 54.62890625, 57.1025390625, 59.576171875, 62.0498046875, 64.5234375, 66.9970703125, 69.470703125, 71.9443359375, 74.41796875, 76.8916015625, 79.365234375, 81.8388671875, 84.3125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 11.0, 113.0, 471.0, 353.0, 58.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.155487060546875, -49.82224655151367, -43.48900604248047, -37.15576171875, -30.822521209716797, -24.489280700683594, -18.156036376953125, -11.822795867919922, -5.489555358886719, 0.8436861038208008, 7.17692756652832, 13.510169982910156, 19.84341049194336, 26.176651000976562, 32.50989532470703, 38.843135833740234, 45.17637634277344, 51.50961685180664, 57.842857360839844, 64.17610168457031, 70.50933837890625, 76.84258270263672, 83.17582702636719, 89.50906372070312, 95.8423080444336, 102.17555236816406, 108.5087890625, 114.84203338623047, 121.17527770996094, 127.50851440429688, 133.84176635742188, 140.1750030517578, 146.50823974609375, 152.8414764404297, 159.1747283935547, 165.50796508789062, 171.84120178222656, 178.1744384765625, 184.5076904296875, 190.84092712402344, 197.17416381835938, 203.5074005126953, 209.8406524658203, 216.17388916015625, 222.5071258544922, 228.84036254882812, 235.17361450195312, 241.50685119628906, 247.84010314941406, 254.17333984375, 260.506591796875, 266.83984375, 273.1730651855469, 279.5063171386719, 285.83953857421875, 292.17279052734375, 298.50604248046875, 304.83929443359375, 311.1725158691406, 317.5057678222656, 323.8390197753906, 330.1722412109375, 336.5054931640625, 342.8387451171875, 349.1719665527344]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 6.0, 13.0, 9.0, 12.0, 9.0, 6.0, 13.0, 27.0, 26.0, 16.0, 19.0, 29.0, 31.0, 34.0, 32.0, 42.0, 48.0, 35.0, 36.0, 46.0, 45.0, 48.0, 48.0, 31.0, 47.0, 37.0, 33.0, 27.0, 33.0, 23.0, 25.0, 24.0, 18.0, 12.0, 15.0, 7.0, 6.0, 6.0, 3.0, 9.0, 2.0, 2.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.41960906982422, -42.93485641479492, -41.450103759765625, -39.96535110473633, -38.48059844970703, -36.99584197998047, -35.51108932495117, -34.026336669921875, -32.54158401489258, -31.05683135986328, -29.572078704833984, -28.087324142456055, -26.602571487426758, -25.11781883239746, -23.63306427001953, -22.148311614990234, -20.663558959960938, -19.17880630493164, -17.694053649902344, -16.209299087524414, -14.724546432495117, -13.23979377746582, -11.755040168762207, -10.270286560058594, -8.785533905029297, -7.300780773162842, -5.816027641296387, -4.331274509429932, -2.8465213775634766, -1.3617682456970215, 0.1229848861694336, 1.6077384948730469, 3.0924911499023438, 4.577244281768799, 6.061997413635254, 7.546750545501709, 9.031503677368164, 10.516256332397461, 12.001009941101074, 13.485763549804688, 14.970516204833984, 16.45526885986328, 17.940021514892578, 19.424776077270508, 20.909528732299805, 22.3942813873291, 23.87903594970703, 25.363788604736328, 26.848541259765625, 28.333293914794922, 29.81804656982422, 31.30280113220215, 32.78755187988281, 34.272308349609375, 35.75706100463867, 37.24181365966797, 38.726566314697266, 40.21131896972656, 41.69607162475586, 43.180824279785156, 44.66558074951172, 46.150333404541016, 47.63508605957031, 49.11983871459961, 50.604591369628906]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 5.0, 6.0, 13.0, 13.0, 4.0, 13.0, 17.0, 29.0, 25.0, 30.0, 30.0, 24.0, 28.0, 29.0, 36.0, 32.0, 30.0, 36.0, 39.0, 46.0, 39.0, 29.0, 37.0, 31.0, 38.0, 42.0, 31.0, 32.0, 23.0, 27.0, 20.0, 24.0, 29.0, 13.0, 8.0, 13.0, 19.0, 12.0, 11.0, 8.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.95703125, -6.71905517578125, -6.4810791015625, -6.24310302734375, -6.005126953125, -5.76715087890625, -5.5291748046875, -5.29119873046875, -5.05322265625, -4.81524658203125, -4.5772705078125, -4.33929443359375, -4.101318359375, -3.86334228515625, -3.6253662109375, -3.38739013671875, -3.1494140625, -2.91143798828125, -2.6734619140625, -2.43548583984375, -2.197509765625, -1.95953369140625, -1.7215576171875, -1.48358154296875, -1.24560546875, -1.00762939453125, -0.7696533203125, -0.53167724609375, -0.293701171875, -0.05572509765625, 0.1822509765625, 0.42022705078125, 0.658203125, 0.89617919921875, 1.1341552734375, 1.37213134765625, 1.610107421875, 1.84808349609375, 2.0860595703125, 2.32403564453125, 2.56201171875, 2.79998779296875, 3.0379638671875, 3.27593994140625, 3.513916015625, 3.75189208984375, 3.9898681640625, 4.22784423828125, 4.4658203125, 4.70379638671875, 4.9417724609375, 5.17974853515625, 5.417724609375, 5.65570068359375, 5.8936767578125, 6.13165283203125, 6.36962890625, 6.60760498046875, 6.8455810546875, 7.08355712890625, 7.321533203125, 7.55950927734375, 7.7974853515625, 8.03546142578125, 8.2734375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 6.0, 5.0, 20.0, 28.0, 41.0, 69.0, 117.0, 141.0, 214.0, 276.0, 388.0, 574.0, 845.0, 1153.0, 1665.0, 2547.0, 3487.0, 5266.0, 7530.0, 11058.0, 16420.0, 25176.0, 38406.0, 60293.0, 94081.0, 138881.0, 172731.0, 154177.0, 108959.0, 70272.0, 45261.0, 29019.0, 19027.0, 12726.0, 8629.0, 5869.0, 3999.0, 2844.0, 1994.0, 1330.0, 861.0, 666.0, 455.0, 335.0, 230.0, 147.0, 128.0, 80.0, 45.0, 21.0, 26.0, 12.0, 8.0, 5.0, 7.0, 6.0, 4.0], "bins": [-0.72705078125, -0.7054595947265625, -0.683868408203125, -0.6622772216796875, -0.64068603515625, -0.6190948486328125, -0.597503662109375, -0.5759124755859375, -0.5543212890625, -0.5327301025390625, -0.511138916015625, -0.4895477294921875, -0.46795654296875, -0.4463653564453125, -0.424774169921875, -0.4031829833984375, -0.381591796875, -0.3600006103515625, -0.338409423828125, -0.3168182373046875, -0.29522705078125, -0.2736358642578125, -0.252044677734375, -0.2304534912109375, -0.2088623046875, -0.1872711181640625, -0.165679931640625, -0.1440887451171875, -0.12249755859375, -0.1009063720703125, -0.079315185546875, -0.0577239990234375, -0.0361328125, -0.0145416259765625, 0.007049560546875, 0.0286407470703125, 0.05023193359375, 0.0718231201171875, 0.093414306640625, 0.1150054931640625, 0.1365966796875, 0.1581878662109375, 0.179779052734375, 0.2013702392578125, 0.22296142578125, 0.2445526123046875, 0.266143798828125, 0.2877349853515625, 0.309326171875, 0.3309173583984375, 0.352508544921875, 0.3740997314453125, 0.39569091796875, 0.4172821044921875, 0.438873291015625, 0.4604644775390625, 0.4820556640625, 0.5036468505859375, 0.525238037109375, 0.5468292236328125, 0.56842041015625, 0.5900115966796875, 0.611602783203125, 0.6331939697265625, 0.65478515625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 6.0, 2.0, 7.0, 3.0, 6.0, 6.0, 9.0, 12.0, 14.0, 19.0, 22.0, 22.0, 19.0, 27.0, 33.0, 40.0, 30.0, 33.0, 27.0, 56.0, 39.0, 35.0, 27.0, 1065.0, 49.0, 38.0, 31.0, 32.0, 24.0, 29.0, 25.0, 36.0, 25.0, 21.0, 29.0, 25.0, 16.0, 15.0, 8.0, 13.0, 11.0, 11.0, 8.0, 5.0, 9.0, 4.0, 3.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-5.05859375, -4.9036865234375, -4.748779296875, -4.5938720703125, -4.43896484375, -4.2840576171875, -4.129150390625, -3.9742431640625, -3.8193359375, -3.6644287109375, -3.509521484375, -3.3546142578125, -3.19970703125, -3.0447998046875, -2.889892578125, -2.7349853515625, -2.580078125, -2.4251708984375, -2.270263671875, -2.1153564453125, -1.96044921875, -1.8055419921875, -1.650634765625, -1.4957275390625, -1.3408203125, -1.1859130859375, -1.031005859375, -0.8760986328125, -0.72119140625, -0.5662841796875, -0.411376953125, -0.2564697265625, -0.1015625, 0.0533447265625, 0.208251953125, 0.3631591796875, 0.51806640625, 0.6729736328125, 0.827880859375, 0.9827880859375, 1.1376953125, 1.2926025390625, 1.447509765625, 1.6024169921875, 1.75732421875, 1.9122314453125, 2.067138671875, 2.2220458984375, 2.376953125, 2.5318603515625, 2.686767578125, 2.8416748046875, 2.99658203125, 3.1514892578125, 3.306396484375, 3.4613037109375, 3.6162109375, 3.7711181640625, 3.926025390625, 4.0809326171875, 4.23583984375, 4.3907470703125, 4.545654296875, 4.7005615234375, 4.85546875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 8.0, 11.0, 11.0, 15.0, 42.0, 62.0, 97.0, 132.0, 192.0, 301.0, 475.0, 820.0, 1180.0, 1929.0, 3027.0, 4964.0, 7976.0, 13280.0, 21817.0, 35977.0, 59336.0, 97241.0, 147603.0, 1231987.0, 166181.0, 116391.0, 72711.0, 44165.0, 26928.0, 16257.0, 9819.0, 6141.0, 3704.0, 2395.0, 1446.0, 909.0, 581.0, 357.0, 245.0, 144.0, 84.0, 71.0, 47.0, 29.0, 11.0, 13.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.623046875, -0.602752685546875, -0.58245849609375, -0.562164306640625, -0.5418701171875, -0.521575927734375, -0.50128173828125, -0.480987548828125, -0.460693359375, -0.440399169921875, -0.42010498046875, -0.399810791015625, -0.3795166015625, -0.359222412109375, -0.33892822265625, -0.318634033203125, -0.29833984375, -0.278045654296875, -0.25775146484375, -0.237457275390625, -0.2171630859375, -0.196868896484375, -0.17657470703125, -0.156280517578125, -0.135986328125, -0.115692138671875, -0.09539794921875, -0.075103759765625, -0.0548095703125, -0.034515380859375, -0.01422119140625, 0.006072998046875, 0.0263671875, 0.046661376953125, 0.06695556640625, 0.087249755859375, 0.1075439453125, 0.127838134765625, 0.14813232421875, 0.168426513671875, 0.188720703125, 0.209014892578125, 0.22930908203125, 0.249603271484375, 0.2698974609375, 0.290191650390625, 0.31048583984375, 0.330780029296875, 0.35107421875, 0.371368408203125, 0.39166259765625, 0.411956787109375, 0.4322509765625, 0.452545166015625, 0.47283935546875, 0.493133544921875, 0.513427734375, 0.533721923828125, 0.55401611328125, 0.574310302734375, 0.5946044921875, 0.614898681640625, 0.63519287109375, 0.655487060546875, 0.67578125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 8.0, 9.0, 5.0, 9.0, 13.0, 17.0, 15.0, 19.0, 27.0, 21.0, 31.0, 41.0, 39.0, 46.0, 73.0, 57.0, 79.0, 53.0, 52.0, 52.0, 50.0, 36.0, 40.0, 38.0, 32.0, 20.0, 22.0, 13.0, 9.0, 8.0, 7.0, 7.0, 10.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.002193450927734375, -0.0021162331104278564, -0.002039015293121338, -0.0019617974758148193, -0.0018845796585083008, -0.0018073618412017822, -0.0017301440238952637, -0.0016529262065887451, -0.0015757083892822266, -0.001498490571975708, -0.0014212727546691895, -0.001344054937362671, -0.0012668371200561523, -0.0011896193027496338, -0.0011124014854431152, -0.0010351836681365967, -0.0009579658508300781, -0.0008807480335235596, -0.000803530216217041, -0.0007263123989105225, -0.0006490945816040039, -0.0005718767642974854, -0.0004946589469909668, -0.00041744112968444824, -0.0003402233123779297, -0.00026300549507141113, -0.00018578767776489258, -0.00010856986045837402, -3.135204315185547e-05, 4.5865774154663086e-05, 0.00012308359146118164, 0.0002003014087677002, 0.00027751922607421875, 0.0003547370433807373, 0.00043195486068725586, 0.0005091726779937744, 0.000586390495300293, 0.0006636083126068115, 0.0007408261299133301, 0.0008180439472198486, 0.0008952617645263672, 0.0009724795818328857, 0.0010496973991394043, 0.0011269152164459229, 0.0012041330337524414, 0.00128135085105896, 0.0013585686683654785, 0.001435786485671997, 0.0015130043029785156, 0.0015902221202850342, 0.0016674399375915527, 0.0017446577548980713, 0.0018218755722045898, 0.0018990933895111084, 0.001976311206817627, 0.0020535290241241455, 0.002130746841430664, 0.0022079646587371826, 0.002285182476043701, 0.0023624002933502197, 0.0024396181106567383, 0.002516835927963257, 0.0025940537452697754, 0.002671271562576294, 0.0027484893798828125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 7.0, 4.0, 8.0, 10.0, 6.0, 11.0, 21.0, 17.0, 15.0, 24.0, 28.0, 30.0, 50.0, 78.0, 98.0, 154.0, 210.0, 342.0, 641.0, 2834.0, 934348.0, 106747.0, 1268.0, 558.0, 313.0, 189.0, 128.0, 80.0, 67.0, 46.0, 38.0, 36.0, 35.0, 24.0, 15.0, 16.0, 14.0, 12.0, 11.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.05303955078125, -0.05151557922363281, -0.049991607666015625, -0.04846763610839844, -0.04694366455078125, -0.04541969299316406, -0.043895721435546875, -0.04237174987792969, -0.0408477783203125, -0.03932380676269531, -0.037799835205078125, -0.03627586364746094, -0.03475189208984375, -0.03322792053222656, -0.031703948974609375, -0.030179977416992188, -0.028656005859375, -0.027132034301757812, -0.025608062744140625, -0.024084091186523438, -0.02256011962890625, -0.021036148071289062, -0.019512176513671875, -0.017988204956054688, -0.0164642333984375, -0.014940261840820312, -0.013416290283203125, -0.011892318725585938, -0.01036834716796875, -0.008844375610351562, -0.007320404052734375, -0.0057964324951171875, -0.0042724609375, -0.0027484893798828125, -0.001224517822265625, 0.0002994537353515625, 0.00182342529296875, 0.0033473968505859375, 0.004871368408203125, 0.0063953399658203125, 0.0079193115234375, 0.009443283081054688, 0.010967254638671875, 0.012491226196289062, 0.01401519775390625, 0.015539169311523438, 0.017063140869140625, 0.018587112426757812, 0.020111083984375, 0.021635055541992188, 0.023159027099609375, 0.024682998657226562, 0.02620697021484375, 0.027730941772460938, 0.029254913330078125, 0.030778884887695312, 0.0323028564453125, 0.03382682800292969, 0.035350799560546875, 0.03687477111816406, 0.03839874267578125, 0.03992271423339844, 0.041446685791015625, 0.04297065734863281, 0.04449462890625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 15.0, 1003.0], "bins": [-0.06981678307056427, -0.06871691346168518, -0.06761705130338669, -0.0665171816945076, -0.0654173195362091, -0.06431744992733002, -0.06321758031845093, -0.062117718160152435, -0.061017848551273346, -0.059917982667684555, -0.058818116784095764, -0.057718247175216675, -0.056618381291627884, -0.05551851540803909, -0.0544186495244503, -0.05331878364086151, -0.05221891775727272, -0.05111905187368393, -0.05001918599009514, -0.04891931638121605, -0.04781945049762726, -0.04671958461403847, -0.045619718730449677, -0.044519852846860886, -0.043419986963272095, -0.042320121079683304, -0.04122025519609451, -0.040120385587215424, -0.03902051970362663, -0.03792065382003784, -0.03682078793644905, -0.03572092205286026, -0.03462105244398117, -0.03352118656039238, -0.03242132067680359, -0.0313214510679245, -0.03022158518433571, -0.029121719300746918, -0.028021853417158127, -0.026921987533569336, -0.025822117924690247, -0.024722252041101456, -0.023622384294867516, -0.022522518411278725, -0.021422650665044785, -0.020322784781455994, -0.019222918897867203, -0.018123053014278412, -0.017023185268044472, -0.01592331938445568, -0.01482345163822174, -0.01372358575463295, -0.012623718939721584, -0.011523852124810219, -0.010423986241221428, -0.009324119426310062, -0.008224252611398697, -0.007124385796487331, -0.006024519447237253, -0.004924653097987175, -0.0038247862830758095, -0.002724919468164444, -0.0016250531189143658, -0.0005251867696642876, 0.0005746795795857906]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 8.0, 15.0, 9.0, 14.0, 35.0, 34.0, 46.0, 54.0, 74.0, 80.0, 81.0, 70.0, 94.0, 73.0, 61.0, 49.0, 43.0, 55.0, 36.0, 23.0, 19.0, 14.0, 9.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014673471450805664, -0.0013855146244168282, -0.00130368210375309, -0.0012218495830893517, -0.0011400170624256134, -0.0010581845417618752, -0.0009763520210981369, -0.0008945195004343987, -0.0008126869797706604, -0.0007308544591069221, -0.0006490219384431839, -0.0005671894177794456, -0.0004853568971157074, -0.00040352437645196915, -0.0003216918557882309, -0.00023985933512449265, -0.0001580268144607544, -7.619429379701614e-05, 5.638226866722107e-06, 8.747074753046036e-05, 0.0001693032681941986, 0.00025113578885793686, 0.0003329683095216751, 0.00041480083018541336, 0.0004966333508491516, 0.0005784658715128899, 0.0006602983921766281, 0.0007421309128403664, 0.0008239634335041046, 0.0009057959541678429, 0.0009876284748315811, 0.0010694609954953194, 0.0011512935161590576, 0.0012331260368227959, 0.0013149585574865341, 0.0013967910781502724, 0.0014786235988140106, 0.0015604561194777489, 0.0016422886401414871, 0.0017241211608052254, 0.0018059536814689636, 0.0018877862021327019, 0.00196961872279644, 0.0020514512434601784, 0.0021332837641239166, 0.002215116284787655, 0.002296948805451393, 0.0023787813261151314, 0.0024606138467788696, 0.002542446367442608, 0.002624278888106346, 0.0027061114087700844, 0.0027879439294338226, 0.002869776450097561, 0.002951608970761299, 0.0030334414914250374, 0.0031152740120887756, 0.003197106532752514, 0.003278939053416252, 0.0033607715740799904, 0.0034426040947437286, 0.003524436615407467, 0.003606269136071205, 0.0036881016567349434, 0.0037699341773986816]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 5.0, 6.0, 14.0, 12.0, 4.0, 13.0, 17.0, 29.0, 25.0, 30.0, 30.0, 24.0, 28.0, 29.0, 36.0, 32.0, 30.0, 36.0, 39.0, 46.0, 39.0, 30.0, 36.0, 31.0, 38.0, 42.0, 31.0, 32.0, 23.0, 27.0, 20.0, 24.0, 29.0, 13.0, 8.0, 13.0, 19.0, 12.0, 11.0, 8.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.95703125, -6.71905517578125, -6.4810791015625, -6.24310302734375, -6.005126953125, -5.76715087890625, -5.5291748046875, -5.29119873046875, -5.05322265625, -4.81524658203125, -4.5772705078125, -4.33929443359375, -4.101318359375, -3.86334228515625, -3.6253662109375, -3.38739013671875, -3.1494140625, -2.91143798828125, -2.6734619140625, -2.43548583984375, -2.197509765625, -1.95953369140625, -1.7215576171875, -1.48358154296875, -1.24560546875, -1.00762939453125, -0.7696533203125, -0.53167724609375, -0.293701171875, -0.05572509765625, 0.1822509765625, 0.42022705078125, 0.658203125, 0.89617919921875, 1.1341552734375, 1.37213134765625, 1.610107421875, 1.84808349609375, 2.0860595703125, 2.32403564453125, 2.56201171875, 2.79998779296875, 3.0379638671875, 3.27593994140625, 3.513916015625, 3.75189208984375, 3.9898681640625, 4.22784423828125, 4.4658203125, 4.70379638671875, 4.9417724609375, 5.17974853515625, 5.417724609375, 5.65570068359375, 5.8936767578125, 6.13165283203125, 6.36962890625, 6.60760498046875, 6.8455810546875, 7.08355712890625, 7.321533203125, 7.55950927734375, 7.7974853515625, 8.03546142578125, 8.2734375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 5.0, 11.0, 11.0, 19.0, 27.0, 42.0, 41.0, 54.0, 72.0, 82.0, 108.0, 165.0, 189.0, 265.0, 340.0, 415.0, 561.0, 721.0, 1008.0, 1381.0, 2337.0, 5068.0, 15430.0, 62761.0, 278814.0, 487146.0, 140464.0, 32122.0, 8821.0, 3437.0, 1816.0, 1152.0, 863.0, 685.0, 450.0, 383.0, 286.0, 249.0, 185.0, 139.0, 93.0, 74.0, 54.0, 54.0, 41.0, 28.0, 22.0, 15.0, 10.0, 6.0, 6.0, 5.0, 6.0, 4.0, 5.0, 3.0, 0.0, 2.0], "bins": [-12.0390625, -11.654052734375, -11.26904296875, -10.884033203125, -10.4990234375, -10.114013671875, -9.72900390625, -9.343994140625, -8.958984375, -8.573974609375, -8.18896484375, -7.803955078125, -7.4189453125, -7.033935546875, -6.64892578125, -6.263916015625, -5.87890625, -5.493896484375, -5.10888671875, -4.723876953125, -4.3388671875, -3.953857421875, -3.56884765625, -3.183837890625, -2.798828125, -2.413818359375, -2.02880859375, -1.643798828125, -1.2587890625, -0.873779296875, -0.48876953125, -0.103759765625, 0.28125, 0.666259765625, 1.05126953125, 1.436279296875, 1.8212890625, 2.206298828125, 2.59130859375, 2.976318359375, 3.361328125, 3.746337890625, 4.13134765625, 4.516357421875, 4.9013671875, 5.286376953125, 5.67138671875, 6.056396484375, 6.44140625, 6.826416015625, 7.21142578125, 7.596435546875, 7.9814453125, 8.366455078125, 8.75146484375, 9.136474609375, 9.521484375, 9.906494140625, 10.29150390625, 10.676513671875, 11.0615234375, 11.446533203125, 11.83154296875, 12.216552734375, 12.6015625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 1.0, 7.0, 6.0, 6.0, 10.0, 10.0, 19.0, 12.0, 20.0, 23.0, 28.0, 21.0, 30.0, 34.0, 42.0, 54.0, 73.0, 89.0, 167.0, 1550.0, 318.0, 84.0, 71.0, 51.0, 37.0, 49.0, 40.0, 37.0, 31.0, 26.0, 11.0, 20.0, 14.0, 13.0, 13.0, 10.0, 6.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.216552734375, -17.47998046875, -16.743408203125, -16.0068359375, -15.270263671875, -14.53369140625, -13.797119140625, -13.060546875, -12.323974609375, -11.58740234375, -10.850830078125, -10.1142578125, -9.377685546875, -8.64111328125, -7.904541015625, -7.16796875, -6.431396484375, -5.69482421875, -4.958251953125, -4.2216796875, -3.485107421875, -2.74853515625, -2.011962890625, -1.275390625, -0.538818359375, 0.19775390625, 0.934326171875, 1.6708984375, 2.407470703125, 3.14404296875, 3.880615234375, 4.6171875, 5.353759765625, 6.09033203125, 6.826904296875, 7.5634765625, 8.300048828125, 9.03662109375, 9.773193359375, 10.509765625, 11.246337890625, 11.98291015625, 12.719482421875, 13.4560546875, 14.192626953125, 14.92919921875, 15.665771484375, 16.40234375, 17.138916015625, 17.87548828125, 18.612060546875, 19.3486328125, 20.085205078125, 20.82177734375, 21.558349609375, 22.294921875, 23.031494140625, 23.76806640625, 24.504638671875, 25.2412109375, 25.977783203125, 26.71435546875, 27.450927734375, 28.1875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 3.0, 4.0, 5.0, 10.0, 7.0, 16.0, 14.0, 20.0, 26.0, 32.0, 40.0, 51.0, 74.0, 93.0, 177.0, 239.0, 435.0, 879.0, 3144.0, 2950346.0, 186506.0, 1817.0, 653.0, 339.0, 209.0, 157.0, 86.0, 71.0, 56.0, 43.0, 32.0, 25.0, 20.0, 13.0, 9.0, 12.0, 6.0, 10.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-64.625, -62.595703125, -60.56640625, -58.537109375, -56.5078125, -54.478515625, -52.44921875, -50.419921875, -48.390625, -46.361328125, -44.33203125, -42.302734375, -40.2734375, -38.244140625, -36.21484375, -34.185546875, -32.15625, -30.126953125, -28.09765625, -26.068359375, -24.0390625, -22.009765625, -19.98046875, -17.951171875, -15.921875, -13.892578125, -11.86328125, -9.833984375, -7.8046875, -5.775390625, -3.74609375, -1.716796875, 0.3125, 2.341796875, 4.37109375, 6.400390625, 8.4296875, 10.458984375, 12.48828125, 14.517578125, 16.546875, 18.576171875, 20.60546875, 22.634765625, 24.6640625, 26.693359375, 28.72265625, 30.751953125, 32.78125, 34.810546875, 36.83984375, 38.869140625, 40.8984375, 42.927734375, 44.95703125, 46.986328125, 49.015625, 51.044921875, 53.07421875, 55.103515625, 57.1328125, 59.162109375, 61.19140625, 63.220703125, 65.25]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 20.0, 511.0, 468.0, 14.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.58877563476562, -142.6553955078125, -134.72203063964844, -126.78865051269531, -118.85527801513672, -110.92190551757812, -102.988525390625, -95.0551528930664, -87.12178039550781, -79.18840789794922, -71.25503540039062, -63.3216552734375, -55.388282775878906, -47.45491027832031, -39.52153396606445, -31.588157653808594, -23.65478515625, -15.721410751342773, -7.788036346435547, 0.1453380584716797, 8.078712463378906, 16.0120849609375, 23.94546127319336, 31.87883758544922, 39.81221008300781, 47.745582580566406, 55.678958892822266, 63.612335205078125, 71.54570770263672, 79.47908020019531, 87.41246032714844, 95.34583282470703, 103.27920532226562, 111.21257781982422, 119.14595031738281, 127.07933044433594, 135.0126953125, 142.94607543945312, 150.87945556640625, 158.81283569335938, 166.74620056152344, 174.67958068847656, 182.61294555664062, 190.54632568359375, 198.47970581054688, 206.41307067871094, 214.34645080566406, 222.27981567382812, 230.21319580078125, 238.14657592773438, 246.07994079589844, 254.01332092285156, 261.9466857910156, 269.88006591796875, 277.8134460449219, 285.746826171875, 293.68017578125, 301.6135559082031, 309.54693603515625, 317.48028564453125, 325.4136657714844, 333.3470458984375, 341.2804260253906, 349.21380615234375, 357.1471862792969]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 7.0, 2.0, 6.0, 3.0, 8.0, 2.0, 5.0, 6.0, 7.0, 8.0, 6.0, 17.0, 9.0, 19.0, 22.0, 29.0, 17.0, 17.0, 29.0, 25.0, 35.0, 43.0, 35.0, 33.0, 31.0, 43.0, 47.0, 39.0, 49.0, 33.0, 37.0, 38.0, 30.0, 27.0, 39.0, 29.0, 19.0, 19.0, 26.0, 25.0, 14.0, 12.0, 14.0, 14.0, 7.0, 6.0, 1.0, 11.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-50.74373245239258, -49.099422454833984, -47.45511245727539, -45.8108024597168, -44.1664924621582, -42.52218246459961, -40.87786865234375, -39.233558654785156, -37.58924865722656, -35.94493865966797, -34.300628662109375, -32.65631866455078, -31.012008666992188, -29.367698669433594, -27.723386764526367, -26.079076766967773, -24.434768676757812, -22.79045867919922, -21.146148681640625, -19.50183868408203, -17.857528686523438, -16.213218688964844, -14.568906784057617, -12.924596786499023, -11.28028678894043, -9.635976791381836, -7.991666316986084, -6.347355842590332, -4.703045845031738, -3.0587358474731445, -1.4144248962402344, 0.22988510131835938, 1.8741989135742188, 3.5185091495513916, 5.1628193855285645, 6.807129859924316, 8.45143985748291, 10.095749855041504, 11.740060806274414, 13.384370803833008, 15.028680801391602, 16.672990798950195, 18.31730079650879, 19.961612701416016, 21.60592269897461, 23.250232696533203, 24.894542694091797, 26.53885269165039, 28.183162689208984, 29.827472686767578, 31.471782684326172, 33.116092681884766, 34.76040267944336, 36.40471267700195, 38.04902648925781, 39.693336486816406, 41.337646484375, 42.981956481933594, 44.62626647949219, 46.27057647705078, 47.914886474609375, 49.55919647216797, 51.20350646972656, 52.847816467285156, 54.49212646484375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 6.0, 10.0, 10.0, 13.0, 9.0, 15.0, 16.0, 24.0, 31.0, 25.0, 35.0, 37.0, 34.0, 30.0, 34.0, 43.0, 39.0, 40.0, 44.0, 44.0, 46.0, 43.0, 30.0, 36.0, 33.0, 35.0, 34.0, 28.0, 28.0, 18.0, 18.0, 16.0, 24.0, 12.0, 11.0, 13.0, 6.0, 5.0, 0.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.8671875, -7.6116943359375, -7.356201171875, -7.1007080078125, -6.84521484375, -6.5897216796875, -6.334228515625, -6.0787353515625, -5.8232421875, -5.5677490234375, -5.312255859375, -5.0567626953125, -4.80126953125, -4.5457763671875, -4.290283203125, -4.0347900390625, -3.779296875, -3.5238037109375, -3.268310546875, -3.0128173828125, -2.75732421875, -2.5018310546875, -2.246337890625, -1.9908447265625, -1.7353515625, -1.4798583984375, -1.224365234375, -0.9688720703125, -0.71337890625, -0.4578857421875, -0.202392578125, 0.0531005859375, 0.30859375, 0.5640869140625, 0.819580078125, 1.0750732421875, 1.33056640625, 1.5860595703125, 1.841552734375, 2.0970458984375, 2.3525390625, 2.6080322265625, 2.863525390625, 3.1190185546875, 3.37451171875, 3.6300048828125, 3.885498046875, 4.1409912109375, 4.396484375, 4.6519775390625, 4.907470703125, 5.1629638671875, 5.41845703125, 5.6739501953125, 5.929443359375, 6.1849365234375, 6.4404296875, 6.6959228515625, 6.951416015625, 7.2069091796875, 7.46240234375, 7.7178955078125, 7.973388671875, 8.2288818359375, 8.484375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 9.0, 6.0, 19.0, 20.0, 19.0, 28.0, 31.0, 61.0, 75.0, 95.0, 113.0, 199.0, 282.0, 410.0, 799.0, 1597.0, 4064.0, 15708.0, 115645.0, 1127391.0, 2446965.0, 424266.0, 42893.0, 8102.0, 2574.0, 1117.0, 581.0, 382.0, 225.0, 162.0, 104.0, 95.0, 64.0, 43.0, 38.0, 24.0, 23.0, 16.0, 5.0, 9.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-19.75, -19.20556640625, -18.6611328125, -18.11669921875, -17.572265625, -17.02783203125, -16.4833984375, -15.93896484375, -15.39453125, -14.85009765625, -14.3056640625, -13.76123046875, -13.216796875, -12.67236328125, -12.1279296875, -11.58349609375, -11.0390625, -10.49462890625, -9.9501953125, -9.40576171875, -8.861328125, -8.31689453125, -7.7724609375, -7.22802734375, -6.68359375, -6.13916015625, -5.5947265625, -5.05029296875, -4.505859375, -3.96142578125, -3.4169921875, -2.87255859375, -2.328125, -1.78369140625, -1.2392578125, -0.69482421875, -0.150390625, 0.39404296875, 0.9384765625, 1.48291015625, 2.02734375, 2.57177734375, 3.1162109375, 3.66064453125, 4.205078125, 4.74951171875, 5.2939453125, 5.83837890625, 6.3828125, 6.92724609375, 7.4716796875, 8.01611328125, 8.560546875, 9.10498046875, 9.6494140625, 10.19384765625, 10.73828125, 11.28271484375, 11.8271484375, 12.37158203125, 12.916015625, 13.46044921875, 14.0048828125, 14.54931640625, 15.09375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 5.0, 3.0, 7.0, 10.0, 13.0, 16.0, 33.0, 26.0, 42.0, 55.0, 79.0, 99.0, 113.0, 171.0, 184.0, 295.0, 395.0, 481.0, 538.0, 396.0, 283.0, 177.0, 144.0, 109.0, 96.0, 72.0, 64.0, 44.0, 39.0, 22.0, 12.0, 18.0, 12.0, 9.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.75, -12.29541015625, -11.8408203125, -11.38623046875, -10.931640625, -10.47705078125, -10.0224609375, -9.56787109375, -9.11328125, -8.65869140625, -8.2041015625, -7.74951171875, -7.294921875, -6.84033203125, -6.3857421875, -5.93115234375, -5.4765625, -5.02197265625, -4.5673828125, -4.11279296875, -3.658203125, -3.20361328125, -2.7490234375, -2.29443359375, -1.83984375, -1.38525390625, -0.9306640625, -0.47607421875, -0.021484375, 0.43310546875, 0.8876953125, 1.34228515625, 1.796875, 2.25146484375, 2.7060546875, 3.16064453125, 3.615234375, 4.06982421875, 4.5244140625, 4.97900390625, 5.43359375, 5.88818359375, 6.3427734375, 6.79736328125, 7.251953125, 7.70654296875, 8.1611328125, 8.61572265625, 9.0703125, 9.52490234375, 9.9794921875, 10.43408203125, 10.888671875, 11.34326171875, 11.7978515625, 12.25244140625, 12.70703125, 13.16162109375, 13.6162109375, 14.07080078125, 14.525390625, 14.97998046875, 15.4345703125, 15.88916015625, 16.34375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 5.0, 10.0, 32.0, 32.0, 57.0, 137.0, 300.0, 779.0, 2824.0, 37355.0, 3735650.0, 407688.0, 7108.0, 1399.0, 482.0, 210.0, 98.0, 51.0, 27.0, 12.0, 7.0, 11.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.78125, -58.197265625, -56.61328125, -55.029296875, -53.4453125, -51.861328125, -50.27734375, -48.693359375, -47.109375, -45.525390625, -43.94140625, -42.357421875, -40.7734375, -39.189453125, -37.60546875, -36.021484375, -34.4375, -32.853515625, -31.26953125, -29.685546875, -28.1015625, -26.517578125, -24.93359375, -23.349609375, -21.765625, -20.181640625, -18.59765625, -17.013671875, -15.4296875, -13.845703125, -12.26171875, -10.677734375, -9.09375, -7.509765625, -5.92578125, -4.341796875, -2.7578125, -1.173828125, 0.41015625, 1.994140625, 3.578125, 5.162109375, 6.74609375, 8.330078125, 9.9140625, 11.498046875, 13.08203125, 14.666015625, 16.25, 17.833984375, 19.41796875, 21.001953125, 22.5859375, 24.169921875, 25.75390625, 27.337890625, 28.921875, 30.505859375, 32.08984375, 33.673828125, 35.2578125, 36.841796875, 38.42578125, 40.009765625, 41.59375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 622.0, 390.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.78530883789062, -173.51446533203125, -144.2436065673828, -114.9727554321289, -85.701904296875, -56.431060791015625, -27.160202026367188, 2.11065673828125, 31.381500244140625, 60.65235137939453, 89.92320251464844, 119.19405364990234, 148.46490478515625, 177.73574829101562, 207.00660705566406, 236.2774658203125, 265.5483093261719, 294.81915283203125, 324.09002685546875, 353.3608703613281, 382.6317138671875, 411.9025573730469, 441.17340087890625, 470.44427490234375, 499.7151184082031, 528.9859619140625, 558.2568359375, 587.5276489257812, 616.7985229492188, 646.0693359375, 675.3402099609375, 704.611083984375, 733.8819580078125, 763.15283203125, 792.4236450195312, 821.6945190429688, 850.96533203125, 880.2362060546875, 909.507080078125, 938.7779541015625, 968.0487670898438, 997.3196411132812, 1026.5904541015625, 1055.861328125, 1085.1322021484375, 1114.403076171875, 1143.673828125, 1172.9447021484375, 1202.215576171875, 1231.4864501953125, 1260.75732421875, 1290.028076171875, 1319.2989501953125, 1348.56982421875, 1377.8406982421875, 1407.111572265625, 1436.38232421875, 1465.6531982421875, 1494.924072265625, 1524.19482421875, 1553.4656982421875, 1582.736572265625, 1612.0074462890625, 1641.2783203125, 1670.5491943359375]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 12.0, 14.0, 6.0, 15.0, 27.0, 24.0, 43.0, 36.0, 45.0, 53.0, 63.0, 59.0, 73.0, 63.0, 74.0, 67.0, 69.0, 45.0, 42.0, 38.0, 35.0, 28.0, 18.0, 18.0, 6.0, 10.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-104.1339111328125, -101.5208740234375, -98.9078369140625, -96.2947998046875, -93.68177032470703, -91.06873321533203, -88.45569610595703, -85.84265899658203, -83.22962188720703, -80.61658477783203, -78.00354766845703, -75.39051818847656, -72.77748107910156, -70.16444396972656, -67.55140686035156, -64.93836975097656, -62.32533645629883, -59.71229934692383, -57.099266052246094, -54.486228942871094, -51.873191833496094, -49.260154724121094, -46.64712142944336, -44.03408432006836, -41.421051025390625, -38.808013916015625, -36.19498062133789, -33.58194351196289, -30.96890640258789, -28.355871200561523, -25.742835998535156, -23.129798889160156, -20.516761779785156, -17.90372657775879, -15.290689468383789, -12.677654266357422, -10.064618110656738, -7.451581954956055, -4.8385467529296875, -2.2255096435546875, 0.3875255584716797, 3.000561475753784, 5.613597393035889, 8.226633071899414, 10.839669227600098, 13.452705383300781, 16.06574058532715, 18.67877769470215, 21.291812896728516, 23.904848098754883, 26.517885208129883, 29.13092041015625, 31.74395751953125, 34.35699462890625, 36.970027923583984, 39.583065032958984, 42.19609832763672, 44.80913543701172, 47.42216873168945, 50.03520584106445, 52.64824295043945, 55.26127624511719, 57.87431335449219, 60.48735046386719, 63.10038757324219]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 5.0, 11.0, 12.0, 12.0, 12.0, 18.0, 14.0, 21.0, 21.0, 28.0, 26.0, 40.0, 31.0, 30.0, 48.0, 40.0, 42.0, 39.0, 37.0, 34.0, 49.0, 36.0, 45.0, 38.0, 35.0, 29.0, 34.0, 34.0, 25.0, 18.0, 21.0, 24.0, 16.0, 16.0, 10.0, 12.0, 6.0, 5.0, 10.0, 3.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.71484375, -6.511962890625, -6.30908203125, -6.106201171875, -5.9033203125, -5.700439453125, -5.49755859375, -5.294677734375, -5.091796875, -4.888916015625, -4.68603515625, -4.483154296875, -4.2802734375, -4.077392578125, -3.87451171875, -3.671630859375, -3.46875, -3.265869140625, -3.06298828125, -2.860107421875, -2.6572265625, -2.454345703125, -2.25146484375, -2.048583984375, -1.845703125, -1.642822265625, -1.43994140625, -1.237060546875, -1.0341796875, -0.831298828125, -0.62841796875, -0.425537109375, -0.22265625, -0.019775390625, 0.18310546875, 0.385986328125, 0.5888671875, 0.791748046875, 0.99462890625, 1.197509765625, 1.400390625, 1.603271484375, 1.80615234375, 2.009033203125, 2.2119140625, 2.414794921875, 2.61767578125, 2.820556640625, 3.0234375, 3.226318359375, 3.42919921875, 3.632080078125, 3.8349609375, 4.037841796875, 4.24072265625, 4.443603515625, 4.646484375, 4.849365234375, 5.05224609375, 5.255126953125, 5.4580078125, 5.660888671875, 5.86376953125, 6.066650390625, 6.26953125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 6.0, 11.0, 17.0, 24.0, 32.0, 47.0, 56.0, 86.0, 99.0, 154.0, 194.0, 267.0, 396.0, 547.0, 742.0, 1071.0, 1499.0, 2202.0, 3214.0, 4439.0, 6701.0, 9730.0, 14893.0, 23005.0, 35586.0, 56628.0, 89718.0, 137319.0, 174507.0, 161472.0, 115445.0, 74067.0, 46677.0, 29179.0, 19043.0, 12535.0, 8514.0, 5563.0, 3842.0, 2591.0, 1834.0, 1343.0, 912.0, 671.0, 465.0, 362.0, 251.0, 167.0, 124.0, 80.0, 70.0, 52.0, 43.0, 16.0, 21.0, 15.0, 6.0, 6.0, 3.0, 4.0, 3.0, 2.0], "bins": [-0.5263671875, -0.5092697143554688, -0.4921722412109375, -0.47507476806640625, -0.457977294921875, -0.44087982177734375, -0.4237823486328125, -0.40668487548828125, -0.38958740234375, -0.37248992919921875, -0.3553924560546875, -0.33829498291015625, -0.321197509765625, -0.30410003662109375, -0.2870025634765625, -0.26990509033203125, -0.2528076171875, -0.23571014404296875, -0.2186126708984375, -0.20151519775390625, -0.184417724609375, -0.16732025146484375, -0.1502227783203125, -0.13312530517578125, -0.11602783203125, -0.09893035888671875, -0.0818328857421875, -0.06473541259765625, -0.047637939453125, -0.03054046630859375, -0.0134429931640625, 0.00365447998046875, 0.020751953125, 0.03784942626953125, 0.0549468994140625, 0.07204437255859375, 0.089141845703125, 0.10623931884765625, 0.1233367919921875, 0.14043426513671875, 0.15753173828125, 0.17462921142578125, 0.1917266845703125, 0.20882415771484375, 0.225921630859375, 0.24301910400390625, 0.2601165771484375, 0.27721405029296875, 0.2943115234375, 0.31140899658203125, 0.3285064697265625, 0.34560394287109375, 0.362701416015625, 0.37979888916015625, 0.3968963623046875, 0.41399383544921875, 0.43109130859375, 0.44818878173828125, 0.4652862548828125, 0.48238372802734375, 0.499481201171875, 0.5165786743164062, 0.5336761474609375, 0.5507736206054688, 0.56787109375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 4.0, 5.0, 7.0, 14.0, 8.0, 6.0, 11.0, 16.0, 10.0, 27.0, 22.0, 21.0, 20.0, 27.0, 28.0, 27.0, 34.0, 40.0, 40.0, 34.0, 39.0, 40.0, 1068.0, 34.0, 43.0, 47.0, 32.0, 34.0, 27.0, 38.0, 23.0, 35.0, 27.0, 22.0, 21.0, 22.0, 10.0, 14.0, 11.0, 5.0, 8.0, 5.0, 6.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.890472412109375, -3.76531982421875, -3.640167236328125, -3.5150146484375, -3.389862060546875, -3.26470947265625, -3.139556884765625, -3.014404296875, -2.889251708984375, -2.76409912109375, -2.638946533203125, -2.5137939453125, -2.388641357421875, -2.26348876953125, -2.138336181640625, -2.01318359375, -1.888031005859375, -1.76287841796875, -1.637725830078125, -1.5125732421875, -1.387420654296875, -1.26226806640625, -1.137115478515625, -1.011962890625, -0.886810302734375, -0.76165771484375, -0.636505126953125, -0.5113525390625, -0.386199951171875, -0.26104736328125, -0.135894775390625, -0.0107421875, 0.114410400390625, 0.23956298828125, 0.364715576171875, 0.4898681640625, 0.615020751953125, 0.74017333984375, 0.865325927734375, 0.990478515625, 1.115631103515625, 1.24078369140625, 1.365936279296875, 1.4910888671875, 1.616241455078125, 1.74139404296875, 1.866546630859375, 1.99169921875, 2.116851806640625, 2.24200439453125, 2.367156982421875, 2.4923095703125, 2.617462158203125, 2.74261474609375, 2.867767333984375, 2.992919921875, 3.118072509765625, 3.24322509765625, 3.368377685546875, 3.4935302734375, 3.618682861328125, 3.74383544921875, 3.868988037109375, 3.994140625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 14.0, 13.0, 21.0, 33.0, 32.0, 64.0, 124.0, 141.0, 244.0, 407.0, 627.0, 983.0, 1481.0, 2572.0, 3743.0, 6279.0, 9908.0, 15953.0, 27132.0, 45483.0, 77539.0, 126638.0, 182235.0, 1233944.0, 141830.0, 88394.0, 52548.0, 30881.0, 18104.0, 11243.0, 6897.0, 4294.0, 2668.0, 1668.0, 1045.0, 684.0, 444.0, 280.0, 178.0, 111.0, 97.0, 56.0, 38.0, 24.0, 15.0, 8.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.54443359375, -0.5274887084960938, -0.5105438232421875, -0.49359893798828125, -0.476654052734375, -0.45970916748046875, -0.4427642822265625, -0.42581939697265625, -0.40887451171875, -0.39192962646484375, -0.3749847412109375, -0.35803985595703125, -0.341094970703125, -0.32415008544921875, -0.3072052001953125, -0.29026031494140625, -0.2733154296875, -0.25637054443359375, -0.2394256591796875, -0.22248077392578125, -0.205535888671875, -0.18859100341796875, -0.1716461181640625, -0.15470123291015625, -0.13775634765625, -0.12081146240234375, -0.1038665771484375, -0.08692169189453125, -0.069976806640625, -0.05303192138671875, -0.0360870361328125, -0.01914215087890625, -0.002197265625, 0.01474761962890625, 0.0316925048828125, 0.04863739013671875, 0.065582275390625, 0.08252716064453125, 0.0994720458984375, 0.11641693115234375, 0.13336181640625, 0.15030670166015625, 0.1672515869140625, 0.18419647216796875, 0.201141357421875, 0.21808624267578125, 0.2350311279296875, 0.25197601318359375, 0.2689208984375, 0.28586578369140625, 0.3028106689453125, 0.31975555419921875, 0.336700439453125, 0.35364532470703125, 0.3705902099609375, 0.38753509521484375, 0.40447998046875, 0.42142486572265625, 0.4383697509765625, 0.45531463623046875, 0.472259521484375, 0.48920440673828125, 0.5061492919921875, 0.5230941772460938, 0.5400390625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 7.0, 6.0, 7.0, 5.0, 12.0, 16.0, 11.0, 19.0, 26.0, 26.0, 31.0, 42.0, 39.0, 40.0, 60.0, 52.0, 54.0, 52.0, 50.0, 55.0, 39.0, 50.0, 37.0, 53.0, 36.0, 22.0, 27.0, 23.0, 13.0, 11.0, 14.0, 13.0, 9.0, 10.0, 5.0, 7.0, 11.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002277374267578125, -0.0022150129079818726, -0.00215265154838562, -0.0020902901887893677, -0.0020279288291931152, -0.001965567469596863, -0.0019032061100006104, -0.001840844750404358, -0.0017784833908081055, -0.001716122031211853, -0.0016537606716156006, -0.0015913993120193481, -0.0015290379524230957, -0.0014666765928268433, -0.0014043152332305908, -0.0013419538736343384, -0.001279592514038086, -0.0012172311544418335, -0.001154869794845581, -0.0010925084352493286, -0.0010301470756530762, -0.0009677857160568237, -0.0009054243564605713, -0.0008430629968643188, -0.0007807016372680664, -0.000718340277671814, -0.0006559789180755615, -0.0005936175584793091, -0.0005312561988830566, -0.0004688948392868042, -0.00040653347969055176, -0.0003441721200942993, -0.0002818107604980469, -0.00021944940090179443, -0.000157088041305542, -9.472668170928955e-05, -3.236532211303711e-05, 2.9996037483215332e-05, 9.235739707946777e-05, 0.00015471875667572021, 0.00021708011627197266, 0.0002794414758682251, 0.00034180283546447754, 0.00040416419506073, 0.0004665255546569824, 0.0005288869142532349, 0.0005912482738494873, 0.0006536096334457397, 0.0007159709930419922, 0.0007783323526382446, 0.0008406937122344971, 0.0009030550718307495, 0.000965416431427002, 0.0010277777910232544, 0.0010901391506195068, 0.0011525005102157593, 0.0012148618698120117, 0.0012772232294082642, 0.0013395845890045166, 0.001401945948600769, 0.0014643073081970215, 0.001526668667793274, 0.0015890300273895264, 0.0016513913869857788, 0.0017137527465820312]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 13.0, 6.0, 11.0, 15.0, 11.0, 17.0, 15.0, 20.0, 35.0, 34.0, 26.0, 41.0, 55.0, 59.0, 103.0, 160.0, 232.0, 328.0, 576.0, 1257.0, 124462.0, 915796.0, 3043.0, 730.0, 425.0, 279.0, 200.0, 134.0, 104.0, 81.0, 50.0, 55.0, 40.0, 27.0, 22.0, 22.0, 15.0, 10.0, 8.0, 19.0, 10.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03265380859375, -0.03149557113647461, -0.03033733367919922, -0.029179096221923828, -0.028020858764648438, -0.026862621307373047, -0.025704383850097656, -0.024546146392822266, -0.023387908935546875, -0.022229671478271484, -0.021071434020996094, -0.019913196563720703, -0.018754959106445312, -0.017596721649169922, -0.01643848419189453, -0.01528024673461914, -0.01412200927734375, -0.01296377182006836, -0.011805534362792969, -0.010647296905517578, -0.009489059448242188, -0.008330821990966797, -0.007172584533691406, -0.006014347076416016, -0.004856109619140625, -0.0036978721618652344, -0.0025396347045898438, -0.0013813972473144531, -0.0002231597900390625, 0.0009350776672363281, 0.0020933151245117188, 0.0032515525817871094, 0.0044097900390625, 0.005568027496337891, 0.006726264953613281, 0.007884502410888672, 0.009042739868164062, 0.010200977325439453, 0.011359214782714844, 0.012517452239990234, 0.013675689697265625, 0.014833927154541016, 0.015992164611816406, 0.017150402069091797, 0.018308639526367188, 0.019466876983642578, 0.02062511444091797, 0.02178335189819336, 0.02294158935546875, 0.02409982681274414, 0.02525806427001953, 0.026416301727294922, 0.027574539184570312, 0.028732776641845703, 0.029891014099121094, 0.031049251556396484, 0.032207489013671875, 0.033365726470947266, 0.034523963928222656, 0.03568220138549805, 0.03684043884277344, 0.03799867630004883, 0.03915691375732422, 0.04031515121459961, 0.041473388671875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 36.0, 491.0, 463.0, 26.0, 0.0, 2.0], "bins": [-0.016192831099033356, -0.01592288166284561, -0.015652932226657867, -0.015382983721792698, -0.015113034285604954, -0.01484308484941721, -0.01457313634455204, -0.014303186908364296, -0.014033237472176552, -0.013763288035988808, -0.013493339531123638, -0.013223390094935894, -0.01295344065874815, -0.012683491222560406, -0.012413542717695236, -0.012143593281507492, -0.011873643845319748, -0.011603694409132004, -0.011333745904266834, -0.01106379646807909, -0.010793847031891346, -0.010523897595703602, -0.010253949090838432, -0.009983999654650688, -0.009714051149785519, -0.009444101713597775, -0.009174153208732605, -0.00890420377254486, -0.008634254336357117, -0.008364304900169373, -0.008094356395304203, -0.007824406959116459, -0.007554457522928715, -0.007284508552402258, -0.007014559116214514, -0.006744610145688057, -0.006474660709500313, -0.006204711738973856, -0.005934762768447399, -0.005664813332259655, -0.005394863896071911, -0.005124914925545454, -0.00485496548935771, -0.004585016518831253, -0.004315067082643509, -0.004045118112117052, -0.0037751689087599516, -0.003505219705402851, -0.0032352707348763943, -0.002965321531519294, -0.0026953723281621933, -0.0024254233576357365, -0.0021554739214479923, -0.0018855248345062137, -0.001615575747564435, -0.0013456265442073345, -0.0010756772244349122, -0.0008057280210778117, -0.0005357788759283721, -0.00026582973077893257, 4.119472578167915e-06, 0.0002740686759352684, 0.0005440177628770471, 0.0008139669662341475, 0.001083916169591248]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 12.0, 17.0, 18.0, 22.0, 23.0, 24.0, 26.0, 20.0, 34.0, 28.0, 40.0, 41.0, 35.0, 38.0, 32.0, 31.0, 34.0, 49.0, 34.0, 43.0, 41.0, 26.0, 36.0, 38.0, 31.0, 25.0, 23.0, 14.0, 15.0, 19.0, 21.0, 15.0, 18.0, 14.0, 6.0, 8.0, 5.0, 7.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009385347366333008, -0.0009065307676792145, -0.0008745267987251282, -0.0008425228297710419, -0.0008105188608169556, -0.0007785148918628693, -0.000746510922908783, -0.0007145069539546967, -0.0006825029850006104, -0.000650499016046524, -0.0006184950470924377, -0.0005864910781383514, -0.0005544871091842651, -0.0005224831402301788, -0.0004904791712760925, -0.0004584752023220062, -0.0004264712333679199, -0.0003944672644138336, -0.0003624632954597473, -0.000330459326505661, -0.0002984553575515747, -0.0002664513885974884, -0.0002344474196434021, -0.0002024434506893158, -0.0001704394817352295, -0.0001384355127811432, -0.00010643154382705688, -7.442757487297058e-05, -4.242360591888428e-05, -1.0419636964797974e-05, 2.158433198928833e-05, 5.3588300943374634e-05, 8.559226989746094e-05, 0.00011759623885154724, 0.00014960020780563354, 0.00018160417675971985, 0.00021360814571380615, 0.00024561211466789246, 0.00027761608362197876, 0.00030962005257606506, 0.00034162402153015137, 0.00037362799048423767, 0.000405631959438324, 0.0004376359283924103, 0.0004696398973464966, 0.0005016438663005829, 0.0005336478352546692, 0.0005656518042087555, 0.0005976557731628418, 0.0006296597421169281, 0.0006616637110710144, 0.0006936676800251007, 0.000725671648979187, 0.0007576756179332733, 0.0007896795868873596, 0.0008216835558414459, 0.0008536875247955322, 0.0008856914937496185, 0.0009176954627037048, 0.0009496994316577911, 0.0009817034006118774, 0.0010137073695659637, 0.00104571133852005, 0.0010777153074741364, 0.0011097192764282227]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 5.0, 11.0, 12.0, 12.0, 12.0, 18.0, 14.0, 21.0, 21.0, 28.0, 26.0, 40.0, 31.0, 30.0, 48.0, 40.0, 42.0, 39.0, 37.0, 34.0, 49.0, 36.0, 45.0, 38.0, 35.0, 29.0, 34.0, 34.0, 25.0, 18.0, 21.0, 24.0, 16.0, 16.0, 10.0, 12.0, 6.0, 5.0, 10.0, 3.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.71484375, -6.511962890625, -6.30908203125, -6.106201171875, -5.9033203125, -5.700439453125, -5.49755859375, -5.294677734375, -5.091796875, -4.888916015625, -4.68603515625, -4.483154296875, -4.2802734375, -4.077392578125, -3.87451171875, -3.671630859375, -3.46875, -3.265869140625, -3.06298828125, -2.860107421875, -2.6572265625, -2.454345703125, -2.25146484375, -2.048583984375, -1.845703125, -1.642822265625, -1.43994140625, -1.237060546875, -1.0341796875, -0.831298828125, -0.62841796875, -0.425537109375, -0.22265625, -0.019775390625, 0.18310546875, 0.385986328125, 0.5888671875, 0.791748046875, 0.99462890625, 1.197509765625, 1.400390625, 1.603271484375, 1.80615234375, 2.009033203125, 2.2119140625, 2.414794921875, 2.61767578125, 2.820556640625, 3.0234375, 3.226318359375, 3.42919921875, 3.632080078125, 3.8349609375, 4.037841796875, 4.24072265625, 4.443603515625, 4.646484375, 4.849365234375, 5.05224609375, 5.255126953125, 5.4580078125, 5.660888671875, 5.86376953125, 6.066650390625, 6.26953125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 8.0, 11.0, 14.0, 13.0, 30.0, 44.0, 77.0, 73.0, 122.0, 147.0, 214.0, 330.0, 433.0, 691.0, 966.0, 1443.0, 2307.0, 4471.0, 12410.0, 85021.0, 693562.0, 209815.0, 22257.0, 5865.0, 2879.0, 1703.0, 1150.0, 719.0, 528.0, 373.0, 269.0, 171.0, 120.0, 89.0, 60.0, 40.0, 38.0, 23.0, 19.0, 18.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.53125, -15.992431640625, -15.45361328125, -14.914794921875, -14.3759765625, -13.837158203125, -13.29833984375, -12.759521484375, -12.220703125, -11.681884765625, -11.14306640625, -10.604248046875, -10.0654296875, -9.526611328125, -8.98779296875, -8.448974609375, -7.91015625, -7.371337890625, -6.83251953125, -6.293701171875, -5.7548828125, -5.216064453125, -4.67724609375, -4.138427734375, -3.599609375, -3.060791015625, -2.52197265625, -1.983154296875, -1.4443359375, -0.905517578125, -0.36669921875, 0.172119140625, 0.7109375, 1.249755859375, 1.78857421875, 2.327392578125, 2.8662109375, 3.405029296875, 3.94384765625, 4.482666015625, 5.021484375, 5.560302734375, 6.09912109375, 6.637939453125, 7.1767578125, 7.715576171875, 8.25439453125, 8.793212890625, 9.33203125, 9.870849609375, 10.40966796875, 10.948486328125, 11.4873046875, 12.026123046875, 12.56494140625, 13.103759765625, 13.642578125, 14.181396484375, 14.72021484375, 15.259033203125, 15.7978515625, 16.336669921875, 16.87548828125, 17.414306640625, 17.953125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 4.0, 9.0, 12.0, 7.0, 18.0, 14.0, 11.0, 27.0, 23.0, 39.0, 32.0, 38.0, 45.0, 49.0, 60.0, 68.0, 161.0, 1529.0, 348.0, 130.0, 43.0, 47.0, 54.0, 32.0, 27.0, 38.0, 26.0, 18.0, 20.0, 18.0, 16.0, 13.0, 10.0, 8.0, 7.0, 9.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.484375, -15.967041015625, -15.44970703125, -14.932373046875, -14.4150390625, -13.897705078125, -13.38037109375, -12.863037109375, -12.345703125, -11.828369140625, -11.31103515625, -10.793701171875, -10.2763671875, -9.759033203125, -9.24169921875, -8.724365234375, -8.20703125, -7.689697265625, -7.17236328125, -6.655029296875, -6.1376953125, -5.620361328125, -5.10302734375, -4.585693359375, -4.068359375, -3.551025390625, -3.03369140625, -2.516357421875, -1.9990234375, -1.481689453125, -0.96435546875, -0.447021484375, 0.0703125, 0.587646484375, 1.10498046875, 1.622314453125, 2.1396484375, 2.656982421875, 3.17431640625, 3.691650390625, 4.208984375, 4.726318359375, 5.24365234375, 5.760986328125, 6.2783203125, 6.795654296875, 7.31298828125, 7.830322265625, 8.34765625, 8.864990234375, 9.38232421875, 9.899658203125, 10.4169921875, 10.934326171875, 11.45166015625, 11.968994140625, 12.486328125, 13.003662109375, 13.52099609375, 14.038330078125, 14.5556640625, 15.072998046875, 15.59033203125, 16.107666015625, 16.625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 5.0, 11.0, 10.0, 11.0, 12.0, 18.0, 32.0, 34.0, 42.0, 52.0, 75.0, 101.0, 117.0, 193.0, 335.0, 636.0, 1933.0, 327576.0, 2809807.0, 2756.0, 738.0, 371.0, 231.0, 169.0, 95.0, 74.0, 53.0, 43.0, 40.0, 26.0, 27.0, 18.0, 12.0, 10.0, 6.0, 7.0, 5.0, 4.0, 2.0, 7.0, 2.0, 1.0, 2.0, 4.0, 2.0], "bins": [-58.5625, -56.9833984375, -55.404296875, -53.8251953125, -52.24609375, -50.6669921875, -49.087890625, -47.5087890625, -45.9296875, -44.3505859375, -42.771484375, -41.1923828125, -39.61328125, -38.0341796875, -36.455078125, -34.8759765625, -33.296875, -31.7177734375, -30.138671875, -28.5595703125, -26.98046875, -25.4013671875, -23.822265625, -22.2431640625, -20.6640625, -19.0849609375, -17.505859375, -15.9267578125, -14.34765625, -12.7685546875, -11.189453125, -9.6103515625, -8.03125, -6.4521484375, -4.873046875, -3.2939453125, -1.71484375, -0.1357421875, 1.443359375, 3.0224609375, 4.6015625, 6.1806640625, 7.759765625, 9.3388671875, 10.91796875, 12.4970703125, 14.076171875, 15.6552734375, 17.234375, 18.8134765625, 20.392578125, 21.9716796875, 23.55078125, 25.1298828125, 26.708984375, 28.2880859375, 29.8671875, 31.4462890625, 33.025390625, 34.6044921875, 36.18359375, 37.7626953125, 39.341796875, 40.9208984375, 42.5]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 12.0, 109.0, 413.0, 391.0, 85.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.259794235229492, -21.80027198791504, -17.340749740600586, -12.881227493286133, -8.42170524597168, -3.9621829986572266, 0.49733924865722656, 4.95686149597168, 9.416383743286133, 13.875905990600586, 18.33542823791504, 22.794950485229492, 27.254472732543945, 31.7139949798584, 36.17351531982422, 40.63304138183594, 45.092559814453125, 49.55208206176758, 54.01160430908203, 58.471126556396484, 62.93064880371094, 67.39016723632812, 71.84969329833984, 76.30921936035156, 80.76873779296875, 85.22825622558594, 89.68778228759766, 94.14730834960938, 98.60682678222656, 103.06634521484375, 107.52587127685547, 111.98539733886719, 116.44491577148438, 120.90443420410156, 125.36396026611328, 129.823486328125, 134.2830047607422, 138.74252319335938, 143.20205688476562, 147.6615753173828, 152.12109375, 156.5806121826172, 161.04013061523438, 165.49966430664062, 169.9591827392578, 174.418701171875, 178.87823486328125, 183.33775329589844, 187.79727172851562, 192.2567901611328, 196.71630859375, 201.17584228515625, 205.63536071777344, 210.09487915039062, 214.55441284179688, 219.01393127441406, 223.47344970703125, 227.93296813964844, 232.39248657226562, 236.85202026367188, 241.31153869628906, 245.77105712890625, 250.2305908203125, 254.6901092529297, 259.1496276855469]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 4.0, 4.0, 10.0, 4.0, 7.0, 12.0, 12.0, 10.0, 25.0, 19.0, 24.0, 26.0, 24.0, 21.0, 32.0, 43.0, 51.0, 34.0, 25.0, 51.0, 48.0, 49.0, 42.0, 28.0, 37.0, 38.0, 38.0, 42.0, 29.0, 26.0, 27.0, 18.0, 17.0, 25.0, 17.0, 11.0, 9.0, 16.0, 6.0, 11.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0], "bins": [-50.01952362060547, -48.573570251464844, -47.12761688232422, -45.68166732788086, -44.235713958740234, -42.78976058959961, -41.34381103515625, -39.897857666015625, -38.451904296875, -37.005950927734375, -35.55999755859375, -34.11404800415039, -32.668094635009766, -31.22214126586914, -29.77618980407715, -28.330238342285156, -26.88428497314453, -25.438331604003906, -23.992380142211914, -22.546428680419922, -21.100475311279297, -19.654521942138672, -18.20857048034668, -16.762619018554688, -15.316665649414062, -13.870713233947754, -12.424760818481445, -10.978808403015137, -9.532855987548828, -8.08690357208252, -6.640951156616211, -5.194998741149902, -3.7490463256835938, -2.303093910217285, -0.8571414947509766, 0.588810920715332, 2.0347633361816406, 3.480715751647949, 4.926668167114258, 6.372620582580566, 7.818572998046875, 9.264525413513184, 10.710477828979492, 12.1564302444458, 13.60238265991211, 15.048335075378418, 16.494287490844727, 17.94023895263672, 19.386192321777344, 20.83214569091797, 22.27809715270996, 23.724048614501953, 25.170001983642578, 26.615955352783203, 28.061906814575195, 29.507858276367188, 30.953811645507812, 32.39976501464844, 33.84571838378906, 35.29166793823242, 36.73762130737305, 38.18357467651367, 39.62952423095703, 41.075477600097656, 42.52143096923828]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 12.0, 8.0, 11.0, 10.0, 17.0, 19.0, 12.0, 20.0, 20.0, 21.0, 21.0, 21.0, 39.0, 45.0, 36.0, 46.0, 28.0, 45.0, 41.0, 33.0, 30.0, 36.0, 39.0, 50.0, 37.0, 33.0, 25.0, 37.0, 24.0, 33.0, 27.0, 12.0, 11.0, 15.0, 18.0, 15.0, 5.0, 5.0, 11.0, 4.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.921875, -6.72161865234375, -6.5213623046875, -6.32110595703125, -6.120849609375, -5.92059326171875, -5.7203369140625, -5.52008056640625, -5.31982421875, -5.11956787109375, -4.9193115234375, -4.71905517578125, -4.518798828125, -4.31854248046875, -4.1182861328125, -3.91802978515625, -3.7177734375, -3.51751708984375, -3.3172607421875, -3.11700439453125, -2.916748046875, -2.71649169921875, -2.5162353515625, -2.31597900390625, -2.11572265625, -1.91546630859375, -1.7152099609375, -1.51495361328125, -1.314697265625, -1.11444091796875, -0.9141845703125, -0.71392822265625, -0.513671875, -0.31341552734375, -0.1131591796875, 0.08709716796875, 0.287353515625, 0.48760986328125, 0.6878662109375, 0.88812255859375, 1.08837890625, 1.28863525390625, 1.4888916015625, 1.68914794921875, 1.889404296875, 2.08966064453125, 2.2899169921875, 2.49017333984375, 2.6904296875, 2.89068603515625, 3.0909423828125, 3.29119873046875, 3.491455078125, 3.69171142578125, 3.8919677734375, 4.09222412109375, 4.29248046875, 4.49273681640625, 4.6929931640625, 4.89324951171875, 5.093505859375, 5.29376220703125, 5.4940185546875, 5.69427490234375, 5.89453125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 7.0, 2.0, 1.0, 5.0, 10.0, 13.0, 13.0, 15.0, 26.0, 27.0, 47.0, 63.0, 85.0, 77.0, 146.0, 203.0, 324.0, 493.0, 722.0, 1147.0, 1823.0, 3089.0, 5791.0, 12429.0, 33601.0, 152004.0, 782161.0, 1955151.0, 972645.0, 200345.0, 42421.0, 14149.0, 6216.0, 3404.0, 1954.0, 1275.0, 763.0, 492.0, 345.0, 223.0, 150.0, 115.0, 75.0, 69.0, 44.0, 35.0, 20.0, 19.0, 15.0, 15.0, 5.0, 5.0, 8.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-10.3046875, -9.9884033203125, -9.672119140625, -9.3558349609375, -9.03955078125, -8.7232666015625, -8.406982421875, -8.0906982421875, -7.7744140625, -7.4581298828125, -7.141845703125, -6.8255615234375, -6.50927734375, -6.1929931640625, -5.876708984375, -5.5604248046875, -5.244140625, -4.9278564453125, -4.611572265625, -4.2952880859375, -3.97900390625, -3.6627197265625, -3.346435546875, -3.0301513671875, -2.7138671875, -2.3975830078125, -2.081298828125, -1.7650146484375, -1.44873046875, -1.1324462890625, -0.816162109375, -0.4998779296875, -0.18359375, 0.1326904296875, 0.448974609375, 0.7652587890625, 1.08154296875, 1.3978271484375, 1.714111328125, 2.0303955078125, 2.3466796875, 2.6629638671875, 2.979248046875, 3.2955322265625, 3.61181640625, 3.9281005859375, 4.244384765625, 4.5606689453125, 4.876953125, 5.1932373046875, 5.509521484375, 5.8258056640625, 6.14208984375, 6.4583740234375, 6.774658203125, 7.0909423828125, 7.4072265625, 7.7235107421875, 8.039794921875, 8.3560791015625, 8.67236328125, 8.9886474609375, 9.304931640625, 9.6212158203125, 9.9375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 11.0, 24.0, 37.0, 64.0, 156.0, 297.0, 587.0, 972.0, 905.0, 516.0, 260.0, 123.0, 55.0, 30.0, 13.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.0625, -25.2451171875, -24.427734375, -23.6103515625, -22.79296875, -21.9755859375, -21.158203125, -20.3408203125, -19.5234375, -18.7060546875, -17.888671875, -17.0712890625, -16.25390625, -15.4365234375, -14.619140625, -13.8017578125, -12.984375, -12.1669921875, -11.349609375, -10.5322265625, -9.71484375, -8.8974609375, -8.080078125, -7.2626953125, -6.4453125, -5.6279296875, -4.810546875, -3.9931640625, -3.17578125, -2.3583984375, -1.541015625, -0.7236328125, 0.09375, 0.9111328125, 1.728515625, 2.5458984375, 3.36328125, 4.1806640625, 4.998046875, 5.8154296875, 6.6328125, 7.4501953125, 8.267578125, 9.0849609375, 9.90234375, 10.7197265625, 11.537109375, 12.3544921875, 13.171875, 13.9892578125, 14.806640625, 15.6240234375, 16.44140625, 17.2587890625, 18.076171875, 18.8935546875, 19.7109375, 20.5283203125, 21.345703125, 22.1630859375, 22.98046875, 23.7978515625, 24.615234375, 25.4326171875, 26.25]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 3.0, 3.0, 1.0, 7.0, 5.0, 12.0, 12.0, 19.0, 38.0, 93.0, 220.0, 601.0, 1585.0, 10874.0, 4021423.0, 154766.0, 2977.0, 922.0, 365.0, 152.0, 84.0, 49.0, 29.0, 11.0, 13.0, 5.0, 6.0, 4.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.59375, -55.88623046875, -54.1787109375, -52.47119140625, -50.763671875, -49.05615234375, -47.3486328125, -45.64111328125, -43.93359375, -42.22607421875, -40.5185546875, -38.81103515625, -37.103515625, -35.39599609375, -33.6884765625, -31.98095703125, -30.2734375, -28.56591796875, -26.8583984375, -25.15087890625, -23.443359375, -21.73583984375, -20.0283203125, -18.32080078125, -16.61328125, -14.90576171875, -13.1982421875, -11.49072265625, -9.783203125, -8.07568359375, -6.3681640625, -4.66064453125, -2.953125, -1.24560546875, 0.4619140625, 2.16943359375, 3.876953125, 5.58447265625, 7.2919921875, 8.99951171875, 10.70703125, 12.41455078125, 14.1220703125, 15.82958984375, 17.537109375, 19.24462890625, 20.9521484375, 22.65966796875, 24.3671875, 26.07470703125, 27.7822265625, 29.48974609375, 31.197265625, 32.90478515625, 34.6123046875, 36.31982421875, 38.02734375, 39.73486328125, 41.4423828125, 43.14990234375, 44.857421875, 46.56494140625, 48.2724609375, 49.97998046875, 51.6875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 248.0, 761.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.84329223632812, -141.57958984375, -124.31590270996094, -107.05220794677734, -89.78851318359375, -72.52481842041016, -55.26112365722656, -37.99742889404297, -20.733734130859375, -3.4700393676757812, 13.793655395507812, 31.057350158691406, 48.321044921875, 65.5847396850586, 82.84843444824219, 100.11212921142578, 117.37582397460938, 134.6395263671875, 151.90321350097656, 169.16690063476562, 186.43060302734375, 203.69430541992188, 220.95799255371094, 238.2216796875, 255.48538208007812, 272.74908447265625, 290.01275634765625, 307.2764587402344, 324.5401611328125, 341.8038635253906, 359.06756591796875, 376.33123779296875, 393.59490966796875, 410.8586120605469, 428.122314453125, 445.385986328125, 462.6496887207031, 479.91339111328125, 497.17706298828125, 514.4407958984375, 531.7044677734375, 548.9681396484375, 566.2318725585938, 583.4955444335938, 600.75927734375, 618.02294921875, 635.28662109375, 652.5503540039062, 669.8140258789062, 687.0776977539062, 704.3414306640625, 721.6051025390625, 738.8687744140625, 756.1325073242188, 773.3961791992188, 790.659912109375, 807.923583984375, 825.187255859375, 842.4509887695312, 859.7146606445312, 876.9783935546875, 894.2420654296875, 911.5057373046875, 928.7694702148438, 946.0331420898438]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 6.0, 8.0, 6.0, 10.0, 12.0, 11.0, 21.0, 17.0, 12.0, 21.0, 29.0, 24.0, 29.0, 33.0, 36.0, 37.0, 49.0, 33.0, 51.0, 37.0, 35.0, 36.0, 45.0, 36.0, 39.0, 36.0, 34.0, 26.0, 35.0, 24.0, 30.0, 23.0, 25.0, 19.0, 15.0, 11.0, 8.0, 8.0, 6.0, 7.0, 5.0, 1.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.69012451171875, -43.33840560913086, -41.98668670654297, -40.634971618652344, -39.28325271606445, -37.93153381347656, -36.57981872558594, -35.22809982299805, -33.876380920410156, -32.524662017822266, -31.172945022583008, -29.82122802734375, -28.46950912475586, -27.11779022216797, -25.76607322692871, -24.414356231689453, -23.062637329101562, -21.710918426513672, -20.359201431274414, -19.007484436035156, -17.655765533447266, -16.304046630859375, -14.952329635620117, -13.600611686706543, -12.248893737792969, -10.897175788879395, -9.54545783996582, -8.193739891052246, -6.842021942138672, -5.490303993225098, -4.138586044311523, -2.786868095397949, -1.435150146484375, -0.08343219757080078, 1.2682857513427734, 2.6200037002563477, 3.971721649169922, 5.323439598083496, 6.67515754699707, 8.026875495910645, 9.378593444824219, 10.730311393737793, 12.082029342651367, 13.433747291564941, 14.785465240478516, 16.137184143066406, 17.488901138305664, 18.840618133544922, 20.192337036132812, 21.544055938720703, 22.89577293395996, 24.24748992919922, 25.59920883178711, 26.950927734375, 28.302644729614258, 29.654361724853516, 31.006080627441406, 32.3577995300293, 33.70951843261719, 35.06123352050781, 36.4129524230957, 37.764671325683594, 39.11638641357422, 40.46810531616211, 41.81982421875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 6.0, 9.0, 3.0, 11.0, 8.0, 25.0, 12.0, 20.0, 15.0, 20.0, 26.0, 29.0, 41.0, 28.0, 32.0, 29.0, 37.0, 27.0, 41.0, 29.0, 45.0, 49.0, 45.0, 36.0, 34.0, 36.0, 34.0, 30.0, 31.0, 33.0, 13.0, 19.0, 18.0, 15.0, 9.0, 17.0, 13.0, 9.0, 15.0, 6.0, 6.0, 7.0, 12.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.40625, -5.2362060546875, -5.066162109375, -4.8961181640625, -4.72607421875, -4.5560302734375, -4.385986328125, -4.2159423828125, -4.0458984375, -3.8758544921875, -3.705810546875, -3.5357666015625, -3.36572265625, -3.1956787109375, -3.025634765625, -2.8555908203125, -2.685546875, -2.5155029296875, -2.345458984375, -2.1754150390625, -2.00537109375, -1.8353271484375, -1.665283203125, -1.4952392578125, -1.3251953125, -1.1551513671875, -0.985107421875, -0.8150634765625, -0.64501953125, -0.4749755859375, -0.304931640625, -0.1348876953125, 0.03515625, 0.2052001953125, 0.375244140625, 0.5452880859375, 0.71533203125, 0.8853759765625, 1.055419921875, 1.2254638671875, 1.3955078125, 1.5655517578125, 1.735595703125, 1.9056396484375, 2.07568359375, 2.2457275390625, 2.415771484375, 2.5858154296875, 2.755859375, 2.9259033203125, 3.095947265625, 3.2659912109375, 3.43603515625, 3.6060791015625, 3.776123046875, 3.9461669921875, 4.1162109375, 4.2862548828125, 4.456298828125, 4.6263427734375, 4.79638671875, 4.9664306640625, 5.136474609375, 5.3065185546875, 5.4765625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 9.0, 6.0, 11.0, 15.0, 33.0, 30.0, 41.0, 61.0, 115.0, 170.0, 239.0, 400.0, 578.0, 900.0, 1358.0, 2117.0, 3295.0, 5113.0, 8323.0, 13398.0, 21888.0, 37478.0, 63684.0, 110468.0, 174195.0, 208413.0, 158255.0, 97483.0, 56017.0, 32654.0, 19347.0, 11969.0, 7364.0, 4706.0, 2996.0, 1933.0, 1226.0, 792.0, 512.0, 295.0, 202.0, 151.0, 104.0, 68.0, 54.0, 31.0, 23.0, 21.0, 10.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.5849609375, -0.5674362182617188, -0.5499114990234375, -0.5323867797851562, -0.514862060546875, -0.49733734130859375, -0.4798126220703125, -0.46228790283203125, -0.44476318359375, -0.42723846435546875, -0.4097137451171875, -0.39218902587890625, -0.374664306640625, -0.35713958740234375, -0.3396148681640625, -0.32209014892578125, -0.3045654296875, -0.28704071044921875, -0.2695159912109375, -0.25199127197265625, -0.234466552734375, -0.21694183349609375, -0.1994171142578125, -0.18189239501953125, -0.16436767578125, -0.14684295654296875, -0.1293182373046875, -0.11179351806640625, -0.094268798828125, -0.07674407958984375, -0.0592193603515625, -0.04169464111328125, -0.024169921875, -0.00664520263671875, 0.0108795166015625, 0.02840423583984375, 0.045928955078125, 0.06345367431640625, 0.0809783935546875, 0.09850311279296875, 0.11602783203125, 0.13355255126953125, 0.1510772705078125, 0.16860198974609375, 0.186126708984375, 0.20365142822265625, 0.2211761474609375, 0.23870086669921875, 0.2562255859375, 0.27375030517578125, 0.2912750244140625, 0.30879974365234375, 0.326324462890625, 0.34384918212890625, 0.3613739013671875, 0.37889862060546875, 0.39642333984375, 0.41394805908203125, 0.4314727783203125, 0.44899749755859375, 0.466522216796875, 0.48404693603515625, 0.5015716552734375, 0.5190963745117188, 0.53662109375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 2.0, 5.0, 4.0, 7.0, 11.0, 8.0, 7.0, 20.0, 14.0, 17.0, 23.0, 27.0, 26.0, 38.0, 40.0, 33.0, 37.0, 41.0, 53.0, 37.0, 45.0, 1068.0, 28.0, 43.0, 38.0, 44.0, 46.0, 32.0, 40.0, 35.0, 28.0, 20.0, 21.0, 16.0, 13.0, 12.0, 8.0, 7.0, 8.0, 7.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.873046875, -3.748382568359375, -3.62371826171875, -3.499053955078125, -3.3743896484375, -3.249725341796875, -3.12506103515625, -3.000396728515625, -2.875732421875, -2.751068115234375, -2.62640380859375, -2.501739501953125, -2.3770751953125, -2.252410888671875, -2.12774658203125, -2.003082275390625, -1.87841796875, -1.753753662109375, -1.62908935546875, -1.504425048828125, -1.3797607421875, -1.255096435546875, -1.13043212890625, -1.005767822265625, -0.881103515625, -0.756439208984375, -0.63177490234375, -0.507110595703125, -0.3824462890625, -0.257781982421875, -0.13311767578125, -0.008453369140625, 0.1162109375, 0.240875244140625, 0.36553955078125, 0.490203857421875, 0.6148681640625, 0.739532470703125, 0.86419677734375, 0.988861083984375, 1.113525390625, 1.238189697265625, 1.36285400390625, 1.487518310546875, 1.6121826171875, 1.736846923828125, 1.86151123046875, 1.986175537109375, 2.11083984375, 2.235504150390625, 2.36016845703125, 2.484832763671875, 2.6094970703125, 2.734161376953125, 2.85882568359375, 2.983489990234375, 3.108154296875, 3.232818603515625, 3.35748291015625, 3.482147216796875, 3.6068115234375, 3.731475830078125, 3.85614013671875, 3.980804443359375, 4.10546875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 12.0, 14.0, 29.0, 37.0, 41.0, 92.0, 130.0, 200.0, 307.0, 465.0, 694.0, 1161.0, 1758.0, 2693.0, 4369.0, 6996.0, 11272.0, 18432.0, 29416.0, 48043.0, 80177.0, 126483.0, 175785.0, 1221696.0, 137747.0, 88804.0, 54145.0, 32446.0, 20049.0, 12361.0, 7865.0, 4958.0, 3075.0, 1967.0, 1213.0, 786.0, 502.0, 328.0, 189.0, 130.0, 83.0, 72.0, 40.0, 21.0, 11.0, 14.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.4462890625, -0.4323883056640625, -0.418487548828125, -0.4045867919921875, -0.39068603515625, -0.3767852783203125, -0.362884521484375, -0.3489837646484375, -0.3350830078125, -0.3211822509765625, -0.307281494140625, -0.2933807373046875, -0.27947998046875, -0.2655792236328125, -0.251678466796875, -0.2377777099609375, -0.223876953125, -0.2099761962890625, -0.196075439453125, -0.1821746826171875, -0.16827392578125, -0.1543731689453125, -0.140472412109375, -0.1265716552734375, -0.1126708984375, -0.0987701416015625, -0.084869384765625, -0.0709686279296875, -0.05706787109375, -0.0431671142578125, -0.029266357421875, -0.0153656005859375, -0.00146484375, 0.0124359130859375, 0.026336669921875, 0.0402374267578125, 0.05413818359375, 0.0680389404296875, 0.081939697265625, 0.0958404541015625, 0.1097412109375, 0.1236419677734375, 0.137542724609375, 0.1514434814453125, 0.16534423828125, 0.1792449951171875, 0.193145751953125, 0.2070465087890625, 0.220947265625, 0.2348480224609375, 0.248748779296875, 0.2626495361328125, 0.27655029296875, 0.2904510498046875, 0.304351806640625, 0.3182525634765625, 0.3321533203125, 0.3460540771484375, 0.359954833984375, 0.3738555908203125, 0.38775634765625, 0.4016571044921875, 0.415557861328125, 0.4294586181640625, 0.443359375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 7.0, 7.0, 9.0, 11.0, 11.0, 11.0, 31.0, 32.0, 32.0, 46.0, 36.0, 43.0, 48.0, 55.0, 64.0, 63.0, 71.0, 66.0, 72.0, 53.0, 36.0, 52.0, 31.0, 25.0, 20.0, 12.0, 17.0, 8.0, 7.0, 7.0, 1.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001407623291015625, -0.0013539493083953857, -0.0013002753257751465, -0.0012466013431549072, -0.001192927360534668, -0.0011392533779144287, -0.0010855793952941895, -0.0010319054126739502, -0.000978231430053711, -0.0009245574474334717, -0.0008708834648132324, -0.0008172094821929932, -0.0007635354995727539, -0.0007098615169525146, -0.0006561875343322754, -0.0006025135517120361, -0.0005488395690917969, -0.0004951655864715576, -0.00044149160385131836, -0.0003878176212310791, -0.00033414363861083984, -0.0002804696559906006, -0.00022679567337036133, -0.00017312169075012207, -0.00011944770812988281, -6.577372550964355e-05, -1.2099742889404297e-05, 4.157423973083496e-05, 9.524822235107422e-05, 0.00014892220497131348, 0.00020259618759155273, 0.000256270170211792, 0.00030994415283203125, 0.0003636181354522705, 0.00041729211807250977, 0.000470966100692749, 0.0005246400833129883, 0.0005783140659332275, 0.0006319880485534668, 0.0006856620311737061, 0.0007393360137939453, 0.0007930099964141846, 0.0008466839790344238, 0.0009003579616546631, 0.0009540319442749023, 0.0010077059268951416, 0.0010613799095153809, 0.0011150538921356201, 0.0011687278747558594, 0.0012224018573760986, 0.0012760758399963379, 0.0013297498226165771, 0.0013834238052368164, 0.0014370977878570557, 0.001490771770477295, 0.0015444457530975342, 0.0015981197357177734, 0.0016517937183380127, 0.001705467700958252, 0.0017591416835784912, 0.0018128156661987305, 0.0018664896488189697, 0.001920163631439209, 0.0019738376140594482, 0.0020275115966796875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 9.0, 10.0, 11.0, 18.0, 28.0, 19.0, 32.0, 45.0, 78.0, 85.0, 141.0, 180.0, 261.0, 422.0, 763.0, 2438.0, 969733.0, 71455.0, 1133.0, 573.0, 344.0, 195.0, 143.0, 114.0, 94.0, 52.0, 43.0, 26.0, 20.0, 24.0, 16.0, 9.0, 11.0, 5.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032440185546875, -0.031450748443603516, -0.03046131134033203, -0.029471874237060547, -0.028482437133789062, -0.027493000030517578, -0.026503562927246094, -0.02551412582397461, -0.024524688720703125, -0.02353525161743164, -0.022545814514160156, -0.021556377410888672, -0.020566940307617188, -0.019577503204345703, -0.01858806610107422, -0.017598628997802734, -0.01660919189453125, -0.015619754791259766, -0.014630317687988281, -0.013640880584716797, -0.012651443481445312, -0.011662006378173828, -0.010672569274902344, -0.00968313217163086, -0.008693695068359375, -0.007704257965087891, -0.006714820861816406, -0.005725383758544922, -0.0047359466552734375, -0.003746509552001953, -0.0027570724487304688, -0.0017676353454589844, -0.0007781982421875, 0.00021123886108398438, 0.0012006759643554688, 0.002190113067626953, 0.0031795501708984375, 0.004168987274169922, 0.005158424377441406, 0.006147861480712891, 0.007137298583984375, 0.00812673568725586, 0.009116172790527344, 0.010105609893798828, 0.011095046997070312, 0.012084484100341797, 0.013073921203613281, 0.014063358306884766, 0.01505279541015625, 0.016042232513427734, 0.01703166961669922, 0.018021106719970703, 0.019010543823242188, 0.019999980926513672, 0.020989418029785156, 0.02197885513305664, 0.022968292236328125, 0.02395772933959961, 0.024947166442871094, 0.025936603546142578, 0.026926040649414062, 0.027915477752685547, 0.02890491485595703, 0.029894351959228516, 0.0308837890625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 43.0, 382.0, 471.0, 99.0, 15.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022740066051483154, -0.0021412076894193888, -0.002008408773690462, -0.0018756099743768573, -0.0017428110586479306, -0.001610012142919004, -0.0014772133436053991, -0.0013444144278764725, -0.0012116155121475458, -0.0010788165964186192, -0.0009460177388973534, -0.0008132188813760877, -0.000680419965647161, -0.0005476210499182343, -0.0004148221923969686, -0.00028202333487570286, -0.0001492244191467762, -1.6425532521679997e-05, 0.0001163733541034162, 0.0002491722407285124, 0.0003819711273536086, 0.0005147700430825353, 0.000647568900603801, 0.0007803677581250668, 0.0009131666738539934, 0.00104596558958292, 0.0011787645053118467, 0.0013115633046254516, 0.0014443622203543782, 0.0015771611360833049, 0.0017099599353969097, 0.0018427588511258364, 0.0019755582325160503, 0.002108357148244977, 0.0022411560639739037, 0.0023739549797028303, 0.002506753895431757, 0.00263955257833004, 0.0027723514940589666, 0.0029051504097878933, 0.00303794932551682, 0.0031707482412457466, 0.0033035471569746733, 0.0034363460727036, 0.003569144755601883, 0.0037019439041614532, 0.0038347425870597363, 0.003967541269958019, 0.00410034041851759, 0.004233139101415873, 0.004365938249975443, 0.004498736932873726, 0.004631536081433296, 0.004764334764331579, 0.0048971339128911495, 0.0050299325957894325, 0.005162731744349003, 0.005295530427247286, 0.005428329575806856, 0.005561128258705139, 0.0056939274072647095, 0.0058267260901629925, 0.005959525238722563, 0.006092323921620846, 0.006225122604519129]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 3.0, 5.0, 3.0, 12.0, 6.0, 12.0, 16.0, 9.0, 11.0, 17.0, 25.0, 31.0, 22.0, 29.0, 36.0, 43.0, 32.0, 55.0, 51.0, 52.0, 35.0, 43.0, 38.0, 37.0, 38.0, 39.0, 42.0, 29.0, 25.0, 35.0, 28.0, 22.0, 24.0, 17.0, 10.0, 20.0, 15.0, 5.0, 7.0, 6.0, 2.0, 8.0, 4.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007557868957519531, -0.0007296176627278328, -0.0007034484297037125, -0.0006772791966795921, -0.0006511099636554718, -0.0006249407306313515, -0.0005987714976072311, -0.0005726022645831108, -0.0005464330315589905, -0.0005202637985348701, -0.0004940945655107498, -0.0004679253324866295, -0.00044175609946250916, -0.0004155868664383888, -0.0003894176334142685, -0.00036324840039014816, -0.00033707916736602783, -0.0003109099343419075, -0.00028474070131778717, -0.00025857146829366684, -0.0002324022352695465, -0.00020623300224542618, -0.00018006376922130585, -0.00015389453619718552, -0.00012772530317306519, -0.00010155607014894485, -7.538683712482452e-05, -4.921760410070419e-05, -2.3048371076583862e-05, 3.1208619475364685e-06, 2.92900949716568e-05, 5.545932799577713e-05, 8.162856101989746e-05, 0.00010779779404401779, 0.00013396702706813812, 0.00016013626009225845, 0.00018630549311637878, 0.00021247472614049911, 0.00023864395916461945, 0.0002648131921887398, 0.0002909824252128601, 0.00031715165823698044, 0.00034332089126110077, 0.0003694901242852211, 0.00039565935730934143, 0.00042182859033346176, 0.0004479978233575821, 0.0004741670563817024, 0.0005003362894058228, 0.0005265055224299431, 0.0005526747554540634, 0.0005788439884781837, 0.0006050132215023041, 0.0006311824545264244, 0.0006573516875505447, 0.0006835209205746651, 0.0007096901535987854, 0.0007358593866229057, 0.0007620286196470261, 0.0007881978526711464, 0.0008143670856952667, 0.0008405363187193871, 0.0008667055517435074, 0.0008928747847676277, 0.000919044017791748]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 6.0, 9.0, 3.0, 11.0, 8.0, 25.0, 12.0, 20.0, 15.0, 20.0, 26.0, 29.0, 41.0, 28.0, 32.0, 29.0, 37.0, 27.0, 41.0, 29.0, 45.0, 49.0, 45.0, 36.0, 34.0, 36.0, 34.0, 30.0, 31.0, 33.0, 13.0, 19.0, 18.0, 15.0, 9.0, 17.0, 13.0, 9.0, 15.0, 6.0, 6.0, 7.0, 12.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.40625, -5.2362060546875, -5.066162109375, -4.8961181640625, -4.72607421875, -4.5560302734375, -4.385986328125, -4.2159423828125, -4.0458984375, -3.8758544921875, -3.705810546875, -3.5357666015625, -3.36572265625, -3.1956787109375, -3.025634765625, -2.8555908203125, -2.685546875, -2.5155029296875, -2.345458984375, -2.1754150390625, -2.00537109375, -1.8353271484375, -1.665283203125, -1.4952392578125, -1.3251953125, -1.1551513671875, -0.985107421875, -0.8150634765625, -0.64501953125, -0.4749755859375, -0.304931640625, -0.1348876953125, 0.03515625, 0.2052001953125, 0.375244140625, 0.5452880859375, 0.71533203125, 0.8853759765625, 1.055419921875, 1.2254638671875, 1.3955078125, 1.5655517578125, 1.735595703125, 1.9056396484375, 2.07568359375, 2.2457275390625, 2.415771484375, 2.5858154296875, 2.755859375, 2.9259033203125, 3.095947265625, 3.2659912109375, 3.43603515625, 3.6060791015625, 3.776123046875, 3.9461669921875, 4.1162109375, 4.2862548828125, 4.456298828125, 4.6263427734375, 4.79638671875, 4.9664306640625, 5.136474609375, 5.3065185546875, 5.4765625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 11.0, 6.0, 8.0, 17.0, 20.0, 34.0, 38.0, 45.0, 58.0, 76.0, 119.0, 159.0, 226.0, 310.0, 436.0, 627.0, 1045.0, 1920.0, 4107.0, 10885.0, 37425.0, 198397.0, 612174.0, 134753.0, 28763.0, 8710.0, 3527.0, 1708.0, 963.0, 570.0, 362.0, 291.0, 175.0, 142.0, 102.0, 84.0, 58.0, 48.0, 29.0, 31.0, 22.0, 19.0, 18.0, 6.0, 6.0, 11.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.8046875, -9.492431640625, -9.18017578125, -8.867919921875, -8.5556640625, -8.243408203125, -7.93115234375, -7.618896484375, -7.306640625, -6.994384765625, -6.68212890625, -6.369873046875, -6.0576171875, -5.745361328125, -5.43310546875, -5.120849609375, -4.80859375, -4.496337890625, -4.18408203125, -3.871826171875, -3.5595703125, -3.247314453125, -2.93505859375, -2.622802734375, -2.310546875, -1.998291015625, -1.68603515625, -1.373779296875, -1.0615234375, -0.749267578125, -0.43701171875, -0.124755859375, 0.1875, 0.499755859375, 0.81201171875, 1.124267578125, 1.4365234375, 1.748779296875, 2.06103515625, 2.373291015625, 2.685546875, 2.997802734375, 3.31005859375, 3.622314453125, 3.9345703125, 4.246826171875, 4.55908203125, 4.871337890625, 5.18359375, 5.495849609375, 5.80810546875, 6.120361328125, 6.4326171875, 6.744873046875, 7.05712890625, 7.369384765625, 7.681640625, 7.993896484375, 8.30615234375, 8.618408203125, 8.9306640625, 9.242919921875, 9.55517578125, 9.867431640625, 10.1796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 5.0, 4.0, 5.0, 8.0, 13.0, 7.0, 23.0, 12.0, 25.0, 22.0, 35.0, 42.0, 59.0, 58.0, 84.0, 132.0, 457.0, 1483.0, 140.0, 89.0, 66.0, 50.0, 49.0, 31.0, 28.0, 24.0, 20.0, 18.0, 14.0, 9.0, 2.0, 8.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.515625, -15.904296875, -15.29296875, -14.681640625, -14.0703125, -13.458984375, -12.84765625, -12.236328125, -11.625, -11.013671875, -10.40234375, -9.791015625, -9.1796875, -8.568359375, -7.95703125, -7.345703125, -6.734375, -6.123046875, -5.51171875, -4.900390625, -4.2890625, -3.677734375, -3.06640625, -2.455078125, -1.84375, -1.232421875, -0.62109375, -0.009765625, 0.6015625, 1.212890625, 1.82421875, 2.435546875, 3.046875, 3.658203125, 4.26953125, 4.880859375, 5.4921875, 6.103515625, 6.71484375, 7.326171875, 7.9375, 8.548828125, 9.16015625, 9.771484375, 10.3828125, 10.994140625, 11.60546875, 12.216796875, 12.828125, 13.439453125, 14.05078125, 14.662109375, 15.2734375, 15.884765625, 16.49609375, 17.107421875, 17.71875, 18.330078125, 18.94140625, 19.552734375, 20.1640625, 20.775390625, 21.38671875, 21.998046875, 22.609375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 4.0, 3.0, 9.0, 11.0, 15.0, 24.0, 38.0, 47.0, 78.0, 121.0, 196.0, 421.0, 927.0, 10417.0, 3128370.0, 3429.0, 735.0, 318.0, 167.0, 122.0, 67.0, 57.0, 25.0, 33.0, 8.0, 10.0, 9.0, 3.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0], "bins": [-67.625, -65.90771484375, -64.1904296875, -62.47314453125, -60.755859375, -59.03857421875, -57.3212890625, -55.60400390625, -53.88671875, -52.16943359375, -50.4521484375, -48.73486328125, -47.017578125, -45.30029296875, -43.5830078125, -41.86572265625, -40.1484375, -38.43115234375, -36.7138671875, -34.99658203125, -33.279296875, -31.56201171875, -29.8447265625, -28.12744140625, -26.41015625, -24.69287109375, -22.9755859375, -21.25830078125, -19.541015625, -17.82373046875, -16.1064453125, -14.38916015625, -12.671875, -10.95458984375, -9.2373046875, -7.52001953125, -5.802734375, -4.08544921875, -2.3681640625, -0.65087890625, 1.06640625, 2.78369140625, 4.5009765625, 6.21826171875, 7.935546875, 9.65283203125, 11.3701171875, 13.08740234375, 14.8046875, 16.52197265625, 18.2392578125, 19.95654296875, 21.673828125, 23.39111328125, 25.1083984375, 26.82568359375, 28.54296875, 30.26025390625, 31.9775390625, 33.69482421875, 35.412109375, 37.12939453125, 38.8466796875, 40.56396484375, 42.28125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 284.0, 673.0, 44.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.14484405517578, -105.12804412841797, -101.11124420166016, -97.09444427490234, -93.07764434814453, -89.06084442138672, -85.0440444946289, -81.0272445678711, -77.01044464111328, -72.99364471435547, -68.97684478759766, -64.96004486083984, -60.94324493408203, -56.92644500732422, -52.909645080566406, -48.892845153808594, -44.87604522705078, -40.85924530029297, -36.842445373535156, -32.825645446777344, -28.80884552001953, -24.79204559326172, -20.775245666503906, -16.758445739746094, -12.741645812988281, -8.724845886230469, -4.708045959472656, -0.6912460327148438, 3.3255538940429688, 7.342353820800781, 11.359153747558594, 15.375953674316406, 19.392745971679688, 23.4095458984375, 27.426345825195312, 31.443145751953125, 35.45994567871094, 39.47674560546875, 43.49354553222656, 47.510345458984375, 51.52714538574219, 55.5439453125, 59.56074523925781, 63.577545166015625, 67.59434509277344, 71.61114501953125, 75.62794494628906, 79.64474487304688, 83.66154479980469, 87.6783447265625, 91.69514465332031, 95.71194458007812, 99.72874450683594, 103.74554443359375, 107.76234436035156, 111.77914428710938, 115.79594421386719, 119.812744140625, 123.82954406738281, 127.84634399414062, 131.86314392089844, 135.87994384765625, 139.89674377441406, 143.91354370117188, 147.9303436279297]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 6.0, 6.0, 9.0, 16.0, 5.0, 15.0, 12.0, 27.0, 26.0, 33.0, 35.0, 29.0, 33.0, 27.0, 45.0, 30.0, 39.0, 43.0, 47.0, 54.0, 50.0, 37.0, 33.0, 35.0, 44.0, 28.0, 34.0, 35.0, 24.0, 23.0, 18.0, 20.0, 14.0, 12.0, 11.0, 12.0, 7.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-37.24935531616211, -36.01531219482422, -34.78126525878906, -33.547218322753906, -32.313175201416016, -31.079130172729492, -29.84508514404297, -28.611040115356445, -27.376995086669922, -26.1429500579834, -24.908905029296875, -23.67486000061035, -22.440814971923828, -21.206769943237305, -19.97272491455078, -18.738679885864258, -17.504634857177734, -16.27058982849121, -15.036544799804688, -13.802499771118164, -12.56845474243164, -11.334409713745117, -10.100364685058594, -8.86631965637207, -7.632274627685547, -6.398229598999023, -5.1641845703125, -3.9301395416259766, -2.696094512939453, -1.4620494842529297, -0.22800445556640625, 1.0060405731201172, 2.240081787109375, 3.4741268157958984, 4.708171844482422, 5.942216873168945, 7.176261901855469, 8.410306930541992, 9.644351959228516, 10.878396987915039, 12.112442016601562, 13.346487045288086, 14.58053207397461, 15.814577102661133, 17.048622131347656, 18.28266716003418, 19.516712188720703, 20.750757217407227, 21.98480224609375, 23.218847274780273, 24.452892303466797, 25.68693733215332, 26.920982360839844, 28.155027389526367, 29.38907241821289, 30.623117446899414, 31.857162475585938, 33.091209411621094, 34.325252532958984, 35.559295654296875, 36.79334259033203, 38.02738952636719, 39.26143264770508, 40.49547576904297, 41.729522705078125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 9.0, 5.0, 8.0, 13.0, 17.0, 12.0, 16.0, 19.0, 14.0, 25.0, 33.0, 46.0, 46.0, 32.0, 43.0, 34.0, 50.0, 43.0, 41.0, 36.0, 43.0, 45.0, 40.0, 36.0, 28.0, 41.0, 29.0, 29.0, 25.0, 18.0, 17.0, 16.0, 22.0, 12.0, 11.0, 13.0, 11.0, 8.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.50390625, -7.27618408203125, -7.0484619140625, -6.82073974609375, -6.593017578125, -6.36529541015625, -6.1375732421875, -5.90985107421875, -5.68212890625, -5.45440673828125, -5.2266845703125, -4.99896240234375, -4.771240234375, -4.54351806640625, -4.3157958984375, -4.08807373046875, -3.8603515625, -3.63262939453125, -3.4049072265625, -3.17718505859375, -2.949462890625, -2.72174072265625, -2.4940185546875, -2.26629638671875, -2.03857421875, -1.81085205078125, -1.5831298828125, -1.35540771484375, -1.127685546875, -0.89996337890625, -0.6722412109375, -0.44451904296875, -0.216796875, 0.01092529296875, 0.2386474609375, 0.46636962890625, 0.694091796875, 0.92181396484375, 1.1495361328125, 1.37725830078125, 1.60498046875, 1.83270263671875, 2.0604248046875, 2.28814697265625, 2.515869140625, 2.74359130859375, 2.9713134765625, 3.19903564453125, 3.4267578125, 3.65447998046875, 3.8822021484375, 4.10992431640625, 4.337646484375, 4.56536865234375, 4.7930908203125, 5.02081298828125, 5.24853515625, 5.47625732421875, 5.7039794921875, 5.93170166015625, 6.159423828125, 6.38714599609375, 6.6148681640625, 6.84259033203125, 7.0703125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 12.0, 13.0, 10.0, 19.0, 17.0, 27.0, 36.0, 45.0, 50.0, 65.0, 74.0, 114.0, 153.0, 158.0, 232.0, 391.0, 506.0, 860.0, 1971.0, 10876.0, 842931.0, 3287922.0, 40930.0, 3484.0, 1079.0, 584.0, 473.0, 295.0, 219.0, 161.0, 132.0, 96.0, 65.0, 58.0, 51.0, 44.0, 26.0, 23.0, 18.0, 17.0, 15.0, 12.0, 2.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-43.25, -42.021484375, -40.79296875, -39.564453125, -38.3359375, -37.107421875, -35.87890625, -34.650390625, -33.421875, -32.193359375, -30.96484375, -29.736328125, -28.5078125, -27.279296875, -26.05078125, -24.822265625, -23.59375, -22.365234375, -21.13671875, -19.908203125, -18.6796875, -17.451171875, -16.22265625, -14.994140625, -13.765625, -12.537109375, -11.30859375, -10.080078125, -8.8515625, -7.623046875, -6.39453125, -5.166015625, -3.9375, -2.708984375, -1.48046875, -0.251953125, 0.9765625, 2.205078125, 3.43359375, 4.662109375, 5.890625, 7.119140625, 8.34765625, 9.576171875, 10.8046875, 12.033203125, 13.26171875, 14.490234375, 15.71875, 16.947265625, 18.17578125, 19.404296875, 20.6328125, 21.861328125, 23.08984375, 24.318359375, 25.546875, 26.775390625, 28.00390625, 29.232421875, 30.4609375, 31.689453125, 32.91796875, 34.146484375, 35.375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 7.0, 9.0, 11.0, 13.0, 43.0, 73.0, 111.0, 186.0, 399.0, 705.0, 912.0, 696.0, 410.0, 200.0, 113.0, 69.0, 44.0, 25.0, 16.0, 10.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0546875, -11.4390869140625, -10.823486328125, -10.2078857421875, -9.59228515625, -8.9766845703125, -8.361083984375, -7.7454833984375, -7.1298828125, -6.5142822265625, -5.898681640625, -5.2830810546875, -4.66748046875, -4.0518798828125, -3.436279296875, -2.8206787109375, -2.205078125, -1.5894775390625, -0.973876953125, -0.3582763671875, 0.25732421875, 0.8729248046875, 1.488525390625, 2.1041259765625, 2.7197265625, 3.3353271484375, 3.950927734375, 4.5665283203125, 5.18212890625, 5.7977294921875, 6.413330078125, 7.0289306640625, 7.64453125, 8.2601318359375, 8.875732421875, 9.4913330078125, 10.10693359375, 10.7225341796875, 11.338134765625, 11.9537353515625, 12.5693359375, 13.1849365234375, 13.800537109375, 14.4161376953125, 15.03173828125, 15.6473388671875, 16.262939453125, 16.8785400390625, 17.494140625, 18.1097412109375, 18.725341796875, 19.3409423828125, 19.95654296875, 20.5721435546875, 21.187744140625, 21.8033447265625, 22.4189453125, 23.0345458984375, 23.650146484375, 24.2657470703125, 24.88134765625, 25.4969482421875, 26.112548828125, 26.7281494140625, 27.34375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 6.0, 8.0, 11.0, 14.0, 43.0, 131.0, 358.0, 1623.0, 11940.0, 528118.0, 3604638.0, 42888.0, 3452.0, 701.0, 197.0, 72.0, 32.0, 24.0, 8.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.5625, -24.548828125, -23.53515625, -22.521484375, -21.5078125, -20.494140625, -19.48046875, -18.466796875, -17.453125, -16.439453125, -15.42578125, -14.412109375, -13.3984375, -12.384765625, -11.37109375, -10.357421875, -9.34375, -8.330078125, -7.31640625, -6.302734375, -5.2890625, -4.275390625, -3.26171875, -2.248046875, -1.234375, -0.220703125, 0.79296875, 1.806640625, 2.8203125, 3.833984375, 4.84765625, 5.861328125, 6.875, 7.888671875, 8.90234375, 9.916015625, 10.9296875, 11.943359375, 12.95703125, 13.970703125, 14.984375, 15.998046875, 17.01171875, 18.025390625, 19.0390625, 20.052734375, 21.06640625, 22.080078125, 23.09375, 24.107421875, 25.12109375, 26.134765625, 27.1484375, 28.162109375, 29.17578125, 30.189453125, 31.203125, 32.216796875, 33.23046875, 34.244140625, 35.2578125, 36.271484375, 37.28515625, 38.298828125, 39.3125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 12.0, 15.0, 29.0, 56.0, 85.0, 121.0, 143.0, 152.0, 120.0, 111.0, 71.0, 42.0, 18.0, 13.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.779624938964844, -55.160125732421875, -51.54062271118164, -47.92112350463867, -44.30162048339844, -40.68212127685547, -37.0626220703125, -33.44312286376953, -29.823619842529297, -26.204118728637695, -22.584617614746094, -18.965118408203125, -15.345617294311523, -11.726116180419922, -8.106616973876953, -4.487115859985352, -0.86761474609375, 2.7518858909606934, 6.371386528015137, 9.990886688232422, 13.610387802124023, 17.229888916015625, 20.849388122558594, 24.468889236450195, 28.088390350341797, 31.7078914642334, 35.327392578125, 38.94689178466797, 42.56639099121094, 46.18589401245117, 49.80539321899414, 53.424896240234375, 57.044403076171875, 60.663902282714844, 64.28340148925781, 67.90290832519531, 71.52240753173828, 75.14190673828125, 78.76140594482422, 82.38090515136719, 86.00041198730469, 89.61991119384766, 93.23941040039062, 96.85891723632812, 100.4784164428711, 104.09791564941406, 107.71741485595703, 111.3369140625, 114.95641326904297, 118.57591247558594, 122.1954116821289, 125.81491088867188, 129.43441772460938, 133.05392456054688, 136.6734161376953, 140.2929229736328, 143.91241455078125, 147.53192138671875, 151.1514129638672, 154.7709197998047, 158.39041137695312, 162.00991821289062, 165.62942504882812, 169.24891662597656, 172.86842346191406]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 10.0, 16.0, 21.0, 17.0, 30.0, 41.0, 34.0, 41.0, 64.0, 47.0, 56.0, 62.0, 61.0, 67.0, 56.0, 48.0, 55.0, 48.0, 45.0, 40.0, 26.0, 24.0, 16.0, 9.0, 25.0, 10.0, 12.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.016571044921875, -58.14812088012695, -56.27967071533203, -54.41122055053711, -52.54277038574219, -50.67432403564453, -48.805870056152344, -46.93742370605469, -45.068973541259766, -43.200523376464844, -41.33207321166992, -39.463623046875, -37.59517288208008, -35.726722717285156, -33.8582763671875, -31.989826202392578, -30.121374130249023, -28.2529239654541, -26.38447380065918, -24.51602554321289, -22.64757537841797, -20.779125213623047, -18.910675048828125, -17.042224884033203, -15.173775672912598, -13.305325508117676, -11.43687629699707, -9.568426132202148, -7.699976444244385, -5.831526756286621, -3.963076591491699, -2.0946273803710938, -0.22617721557617188, 1.6422725915908813, 3.5107223987579346, 5.379172325134277, 7.247622013092041, 9.116071701049805, 10.984521865844727, 12.852971076965332, 14.721421241760254, 16.58987045288086, 18.45832061767578, 20.326770782470703, 22.195220947265625, 24.063671112060547, 25.93212127685547, 27.800569534301758, 29.66901969909668, 31.5374698638916, 33.40591812133789, 35.27436828613281, 37.142818450927734, 39.011268615722656, 40.87971878051758, 42.7481689453125, 44.61661911010742, 46.485069274902344, 48.353519439697266, 50.22196960449219, 52.09041976928711, 53.95886993408203, 55.82731628417969, 57.69576644897461, 59.56421661376953]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 8.0, 15.0, 17.0, 27.0, 31.0, 44.0, 36.0, 67.0, 64.0, 61.0, 70.0, 78.0, 65.0, 74.0, 55.0, 63.0, 51.0, 52.0, 20.0, 19.0, 21.0, 16.0, 12.0, 16.0, 5.0, 7.0, 0.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.625, -100.044921875, -96.46484375, -92.884765625, -89.3046875, -85.724609375, -82.14453125, -78.564453125, -74.984375, -71.404296875, -67.82421875, -64.244140625, -60.6640625, -57.083984375, -53.50390625, -49.923828125, -46.34375, -42.763671875, -39.18359375, -35.603515625, -32.0234375, -28.443359375, -24.86328125, -21.283203125, -17.703125, -14.123046875, -10.54296875, -6.962890625, -3.3828125, 0.197265625, 3.77734375, 7.357421875, 10.9375, 14.517578125, 18.09765625, 21.677734375, 25.2578125, 28.837890625, 32.41796875, 35.998046875, 39.578125, 43.158203125, 46.73828125, 50.318359375, 53.8984375, 57.478515625, 61.05859375, 64.638671875, 68.21875, 71.798828125, 75.37890625, 78.958984375, 82.5390625, 86.119140625, 89.69921875, 93.279296875, 96.859375, 100.439453125, 104.01953125, 107.599609375, 111.1796875, 114.759765625, 118.33984375, 121.919921875, 125.5]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 7.0, 11.0, 26.0, 30.0, 37.0, 80.0, 105.0, 121.0, 207.0, 307.0, 419.0, 613.0, 959.0, 1490.0, 2099.0, 3121.0, 4675.0, 6947.0, 10388.0, 16115.0, 24456.0, 36770.0, 56150.0, 82494.0, 115557.0, 148673.0, 151944.0, 121640.0, 86611.0, 59772.0, 39523.0, 26443.0, 17159.0, 11186.0, 7300.0, 4989.0, 3261.0, 2257.0, 1498.0, 995.0, 674.0, 442.0, 330.0, 218.0, 141.0, 108.0, 86.0, 42.0, 35.0, 17.0, 14.0, 12.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.96051025390625, -3.8194580078125, -3.67840576171875, -3.537353515625, -3.39630126953125, -3.2552490234375, -3.11419677734375, -2.97314453125, -2.83209228515625, -2.6910400390625, -2.54998779296875, -2.408935546875, -2.26788330078125, -2.1268310546875, -1.98577880859375, -1.8447265625, -1.70367431640625, -1.5626220703125, -1.42156982421875, -1.280517578125, -1.13946533203125, -0.9984130859375, -0.85736083984375, -0.71630859375, -0.57525634765625, -0.4342041015625, -0.29315185546875, -0.152099609375, -0.01104736328125, 0.1300048828125, 0.27105712890625, 0.412109375, 0.55316162109375, 0.6942138671875, 0.83526611328125, 0.976318359375, 1.11737060546875, 1.2584228515625, 1.39947509765625, 1.54052734375, 1.68157958984375, 1.8226318359375, 1.96368408203125, 2.104736328125, 2.24578857421875, 2.3868408203125, 2.52789306640625, 2.6689453125, 2.80999755859375, 2.9510498046875, 3.09210205078125, 3.233154296875, 3.37420654296875, 3.5152587890625, 3.65631103515625, 3.79736328125, 3.93841552734375, 4.0794677734375, 4.22052001953125, 4.361572265625, 4.50262451171875, 4.6436767578125, 4.78472900390625, 4.92578125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 8.0, 10.0, 7.0, 7.0, 13.0, 16.0, 23.0, 26.0, 30.0, 35.0, 31.0, 32.0, 36.0, 35.0, 47.0, 51.0, 60.0, 1079.0, 47.0, 54.0, 50.0, 40.0, 38.0, 39.0, 34.0, 33.0, 24.0, 27.0, 18.0, 17.0, 14.0, 9.0, 7.0, 8.0, 7.0, 6.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-58.96875, -57.3046875, -55.640625, -53.9765625, -52.3125, -50.6484375, -48.984375, -47.3203125, -45.65625, -43.9921875, -42.328125, -40.6640625, -39.0, -37.3359375, -35.671875, -34.0078125, -32.34375, -30.6796875, -29.015625, -27.3515625, -25.6875, -24.0234375, -22.359375, -20.6953125, -19.03125, -17.3671875, -15.703125, -14.0390625, -12.375, -10.7109375, -9.046875, -7.3828125, -5.71875, -4.0546875, -2.390625, -0.7265625, 0.9375, 2.6015625, 4.265625, 5.9296875, 7.59375, 9.2578125, 10.921875, 12.5859375, 14.25, 15.9140625, 17.578125, 19.2421875, 20.90625, 22.5703125, 24.234375, 25.8984375, 27.5625, 29.2265625, 30.890625, 32.5546875, 34.21875, 35.8828125, 37.546875, 39.2109375, 40.875, 42.5390625, 44.203125, 45.8671875, 47.53125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 0.0, 8.0, 17.0, 21.0, 34.0, 56.0, 73.0, 124.0, 184.0, 246.0, 412.0, 571.0, 915.0, 1358.0, 2145.0, 3161.0, 4956.0, 7551.0, 11899.0, 18524.0, 29348.0, 45965.0, 72437.0, 108975.0, 147532.0, 1212034.0, 141241.0, 102002.0, 67003.0, 42992.0, 27010.0, 17129.0, 10892.0, 7036.0, 4635.0, 3057.0, 1918.0, 1240.0, 817.0, 539.0, 369.0, 249.0, 166.0, 109.0, 64.0, 50.0, 24.0, 10.0, 19.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.9765625, -4.82763671875, -4.6787109375, -4.52978515625, -4.380859375, -4.23193359375, -4.0830078125, -3.93408203125, -3.78515625, -3.63623046875, -3.4873046875, -3.33837890625, -3.189453125, -3.04052734375, -2.8916015625, -2.74267578125, -2.59375, -2.44482421875, -2.2958984375, -2.14697265625, -1.998046875, -1.84912109375, -1.7001953125, -1.55126953125, -1.40234375, -1.25341796875, -1.1044921875, -0.95556640625, -0.806640625, -0.65771484375, -0.5087890625, -0.35986328125, -0.2109375, -0.06201171875, 0.0869140625, 0.23583984375, 0.384765625, 0.53369140625, 0.6826171875, 0.83154296875, 0.98046875, 1.12939453125, 1.2783203125, 1.42724609375, 1.576171875, 1.72509765625, 1.8740234375, 2.02294921875, 2.171875, 2.32080078125, 2.4697265625, 2.61865234375, 2.767578125, 2.91650390625, 3.0654296875, 3.21435546875, 3.36328125, 3.51220703125, 3.6611328125, 3.81005859375, 3.958984375, 4.10791015625, 4.2568359375, 4.40576171875, 4.5546875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 6.0, 3.0, 4.0, 3.0, 8.0, 4.0, 16.0, 13.0, 12.0, 19.0, 20.0, 26.0, 22.0, 26.0, 36.0, 35.0, 44.0, 51.0, 46.0, 58.0, 43.0, 61.0, 50.0, 54.0, 43.0, 39.0, 43.0, 31.0, 27.0, 14.0, 28.0, 18.0, 24.0, 13.0, 12.0, 15.0, 10.0, 10.0, 5.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03857421875, -0.0370182991027832, -0.035462379455566406, -0.03390645980834961, -0.03235054016113281, -0.030794620513916016, -0.02923870086669922, -0.027682781219482422, -0.026126861572265625, -0.024570941925048828, -0.02301502227783203, -0.021459102630615234, -0.019903182983398438, -0.01834726333618164, -0.016791343688964844, -0.015235424041748047, -0.01367950439453125, -0.012123584747314453, -0.010567665100097656, -0.00901174545288086, -0.0074558258056640625, -0.005899906158447266, -0.004343986511230469, -0.002788066864013672, -0.001232147216796875, 0.0003237724304199219, 0.0018796920776367188, 0.0034356117248535156, 0.0049915313720703125, 0.006547451019287109, 0.008103370666503906, 0.009659290313720703, 0.0112152099609375, 0.012771129608154297, 0.014327049255371094, 0.01588296890258789, 0.017438888549804688, 0.018994808197021484, 0.02055072784423828, 0.022106647491455078, 0.023662567138671875, 0.025218486785888672, 0.02677440643310547, 0.028330326080322266, 0.029886245727539062, 0.03144216537475586, 0.032998085021972656, 0.03455400466918945, 0.03610992431640625, 0.03766584396362305, 0.039221763610839844, 0.04077768325805664, 0.04233360290527344, 0.043889522552490234, 0.04544544219970703, 0.04700136184692383, 0.048557281494140625, 0.05011320114135742, 0.05166912078857422, 0.053225040435791016, 0.05478096008300781, 0.05633687973022461, 0.057892799377441406, 0.0594487190246582, 0.061004638671875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 13.0, 20.0, 17.0, 34.0, 33.0, 71.0, 80.0, 120.0, 164.0, 217.0, 299.0, 448.0, 818.0, 1456.0, 3103.0, 7092.0, 18668.0, 57645.0, 235257.0, 517072.0, 142015.0, 39340.0, 13687.0, 5299.0, 2388.0, 1163.0, 668.0, 389.0, 293.0, 204.0, 132.0, 109.0, 63.0, 56.0, 33.0, 26.0, 21.0, 8.0, 6.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.351806640625, -0.34238433837890625, -0.3329620361328125, -0.32353973388671875, -0.314117431640625, -0.30469512939453125, -0.2952728271484375, -0.28585052490234375, -0.27642822265625, -0.26700592041015625, -0.2575836181640625, -0.24816131591796875, -0.238739013671875, -0.22931671142578125, -0.2198944091796875, -0.21047210693359375, -0.2010498046875, -0.19162750244140625, -0.1822052001953125, -0.17278289794921875, -0.163360595703125, -0.15393829345703125, -0.1445159912109375, -0.13509368896484375, -0.12567138671875, -0.11624908447265625, -0.1068267822265625, -0.09740447998046875, -0.087982177734375, -0.07855987548828125, -0.0691375732421875, -0.05971527099609375, -0.05029296875, -0.04087066650390625, -0.0314483642578125, -0.02202606201171875, -0.012603759765625, -0.00318145751953125, 0.0062408447265625, 0.01566314697265625, 0.02508544921875, 0.03450775146484375, 0.0439300537109375, 0.05335235595703125, 0.062774658203125, 0.07219696044921875, 0.0816192626953125, 0.09104156494140625, 0.1004638671875, 0.10988616943359375, 0.1193084716796875, 0.12873077392578125, 0.138153076171875, 0.14757537841796875, 0.1569976806640625, 0.16641998291015625, 0.17584228515625, 0.18526458740234375, 0.1946868896484375, 0.20410919189453125, 0.213531494140625, 0.22295379638671875, 0.2323760986328125, 0.24179840087890625, 0.251220703125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 9.0, 4.0, 9.0, 8.0, 12.0, 18.0, 17.0, 21.0, 32.0, 56.0, 59.0, 90.0, 81.0, 93.0, 95.0, 89.0, 73.0, 63.0, 48.0, 25.0, 28.0, 19.0, 9.0, 7.0, 10.0, 9.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03601740300655365, -0.03450973704457283, -0.03300207108259201, -0.03149440884590149, -0.02998674288392067, -0.02847907692193985, -0.02697141282260418, -0.02546374872326851, -0.02395608276128769, -0.02244841679930687, -0.0209407526999712, -0.01943308860063553, -0.01792542263865471, -0.01641775667667389, -0.014910092577338219, -0.013402427546679974, -0.011894762516021729, -0.010387097485363483, -0.008879432454705238, -0.007371767424046993, -0.005864102393388748, -0.004356437362730503, -0.002848772332072258, -0.001341107301414013, 0.00016655772924423218, 0.0016742227599024773, 0.0031818877905607224, 0.0046895528212189674, 0.0061972178518772125, 0.007704882882535458, 0.009212547913193703, 0.010720212943851948, 0.012227877974510193, 0.013735543005168438, 0.015243208035826683, 0.016750872135162354, 0.018258538097143173, 0.019766204059123993, 0.021273868158459663, 0.022781532257795334, 0.024289198219776154, 0.025796864181756973, 0.027304528281092644, 0.028812192380428314, 0.030319858342409134, 0.031827524304389954, 0.033335186541080475, 0.034842852503061295, 0.036350518465042114, 0.037858184427022934, 0.039365850389003754, 0.040873512625694275, 0.042381178587675095, 0.043888844549655914, 0.045396506786346436, 0.046904172748327255, 0.048411838710308075, 0.049919504672288895, 0.051427170634269714, 0.052934832870960236, 0.054442498832941055, 0.055950164794921875, 0.057457827031612396, 0.058965492993593216, 0.060473158955574036]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 9.0, 3.0, 11.0, 15.0, 18.0, 18.0, 19.0, 29.0, 22.0, 38.0, 33.0, 35.0, 33.0, 46.0, 30.0, 51.0, 45.0, 41.0, 48.0, 47.0, 32.0, 34.0, 27.0, 40.0, 24.0, 31.0, 31.0, 31.0, 32.0, 23.0, 15.0, 16.0, 18.0, 13.0, 6.0, 4.0, 8.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03325134515762329, -0.032247722148895264, -0.031244101002812386, -0.030240479856729507, -0.02923685684800148, -0.028233233839273453, -0.027229612693190575, -0.026225991547107697, -0.02522236853837967, -0.024218745529651642, -0.023215124383568764, -0.022211503237485886, -0.02120788022875786, -0.02020425722002983, -0.019200636073946953, -0.018197014927864075, -0.017193391919136047, -0.01618976891040802, -0.015186147764325142, -0.01418252568691969, -0.013178903609514236, -0.012175281532108784, -0.011171659454703331, -0.010168037377297878, -0.009164415299892426, -0.008160793222486973, -0.00715717114508152, -0.006153549067676067, -0.005149926990270615, -0.004146304912865162, -0.003142682835459709, -0.0021390607580542564, -0.0011354386806488037, -0.00013181660324335098, 0.0008718054741621017, 0.0018754275515675545, 0.002879049628973007, 0.00388267170637846, 0.004886293783783913, 0.005889915861189365, 0.006893537938594818, 0.00789716001600027, 0.008900782093405724, 0.009904404170811176, 0.010908026248216629, 0.011911648325622082, 0.012915270403027534, 0.013918892480432987, 0.01492251455783844, 0.015926137566566467, 0.016929758712649345, 0.017933379858732224, 0.01893700286746025, 0.019940625876188278, 0.020944247022271156, 0.021947868168354034, 0.022951491177082062, 0.02395511418581009, 0.024958735331892967, 0.025962356477975845, 0.026965979486703873, 0.0279696024954319, 0.028973223641514778, 0.029976844787597656, 0.030980467796325684]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 8.0, 15.0, 17.0, 26.0, 30.0, 46.0, 34.0, 67.0, 63.0, 63.0, 70.0, 74.0, 69.0, 74.0, 55.0, 63.0, 50.0, 53.0, 22.0, 18.0, 21.0, 16.0, 12.0, 14.0, 6.0, 8.0, 0.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.875, -100.2890625, -96.703125, -93.1171875, -89.53125, -85.9453125, -82.359375, -78.7734375, -75.1875, -71.6015625, -68.015625, -64.4296875, -60.84375, -57.2578125, -53.671875, -50.0859375, -46.5, -42.9140625, -39.328125, -35.7421875, -32.15625, -28.5703125, -24.984375, -21.3984375, -17.8125, -14.2265625, -10.640625, -7.0546875, -3.46875, 0.1171875, 3.703125, 7.2890625, 10.875, 14.4609375, 18.046875, 21.6328125, 25.21875, 28.8046875, 32.390625, 35.9765625, 39.5625, 43.1484375, 46.734375, 50.3203125, 53.90625, 57.4921875, 61.078125, 64.6640625, 68.25, 71.8359375, 75.421875, 79.0078125, 82.59375, 86.1796875, 89.765625, 93.3515625, 96.9375, 100.5234375, 104.109375, 107.6953125, 111.28125, 114.8671875, 118.453125, 122.0390625, 125.625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 8.0, 18.0, 25.0, 35.0, 56.0, 103.0, 177.0, 325.0, 793.0, 1966.0, 5432.0, 23050.0, 257912.0, 687421.0, 56869.0, 9456.0, 2776.0, 1091.0, 462.0, 212.0, 126.0, 82.0, 46.0, 39.0, 19.0, 14.0, 15.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.875, -24.9580078125, -24.041015625, -23.1240234375, -22.20703125, -21.2900390625, -20.373046875, -19.4560546875, -18.5390625, -17.6220703125, -16.705078125, -15.7880859375, -14.87109375, -13.9541015625, -13.037109375, -12.1201171875, -11.203125, -10.2861328125, -9.369140625, -8.4521484375, -7.53515625, -6.6181640625, -5.701171875, -4.7841796875, -3.8671875, -2.9501953125, -2.033203125, -1.1162109375, -0.19921875, 0.7177734375, 1.634765625, 2.5517578125, 3.46875, 4.3857421875, 5.302734375, 6.2197265625, 7.13671875, 8.0537109375, 8.970703125, 9.8876953125, 10.8046875, 11.7216796875, 12.638671875, 13.5556640625, 14.47265625, 15.3896484375, 16.306640625, 17.2236328125, 18.140625, 19.0576171875, 19.974609375, 20.8916015625, 21.80859375, 22.7255859375, 23.642578125, 24.5595703125, 25.4765625, 26.3935546875, 27.310546875, 28.2275390625, 29.14453125, 30.0615234375, 30.978515625, 31.8955078125, 32.8125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 13.0, 15.0, 18.0, 49.0, 43.0, 50.0, 72.0, 66.0, 87.0, 2125.0, 101.0, 86.0, 57.0, 72.0, 47.0, 37.0, 31.0, 22.0, 14.0, 5.0, 10.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.75, -135.26953125, -129.7890625, -124.30859375, -118.828125, -113.34765625, -107.8671875, -102.38671875, -96.90625, -91.42578125, -85.9453125, -80.46484375, -74.984375, -69.50390625, -64.0234375, -58.54296875, -53.0625, -47.58203125, -42.1015625, -36.62109375, -31.140625, -25.66015625, -20.1796875, -14.69921875, -9.21875, -3.73828125, 1.7421875, 7.22265625, 12.703125, 18.18359375, 23.6640625, 29.14453125, 34.625, 40.10546875, 45.5859375, 51.06640625, 56.546875, 62.02734375, 67.5078125, 72.98828125, 78.46875, 83.94921875, 89.4296875, 94.91015625, 100.390625, 105.87109375, 111.3515625, 116.83203125, 122.3125, 127.79296875, 133.2734375, 138.75390625, 144.234375, 149.71484375, 155.1953125, 160.67578125, 166.15625, 171.63671875, 177.1171875, 182.59765625, 188.078125, 193.55859375, 199.0390625, 204.51953125, 210.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 7.0, 11.0, 12.0, 22.0, 22.0, 38.0, 53.0, 78.0, 144.0, 215.0, 316.0, 586.0, 1313.0, 3969.0, 34940.0, 2849714.0, 238521.0, 11329.0, 2339.0, 853.0, 443.0, 252.0, 184.0, 104.0, 70.0, 36.0, 36.0, 32.0, 15.0, 13.0, 5.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.09375, -36.05712890625, -35.0205078125, -33.98388671875, -32.947265625, -31.91064453125, -30.8740234375, -29.83740234375, -28.80078125, -27.76416015625, -26.7275390625, -25.69091796875, -24.654296875, -23.61767578125, -22.5810546875, -21.54443359375, -20.5078125, -19.47119140625, -18.4345703125, -17.39794921875, -16.361328125, -15.32470703125, -14.2880859375, -13.25146484375, -12.21484375, -11.17822265625, -10.1416015625, -9.10498046875, -8.068359375, -7.03173828125, -5.9951171875, -4.95849609375, -3.921875, -2.88525390625, -1.8486328125, -0.81201171875, 0.224609375, 1.26123046875, 2.2978515625, 3.33447265625, 4.37109375, 5.40771484375, 6.4443359375, 7.48095703125, 8.517578125, 9.55419921875, 10.5908203125, 11.62744140625, 12.6640625, 13.70068359375, 14.7373046875, 15.77392578125, 16.810546875, 17.84716796875, 18.8837890625, 19.92041015625, 20.95703125, 21.99365234375, 23.0302734375, 24.06689453125, 25.103515625, 26.14013671875, 27.1767578125, 28.21337890625, 29.25]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 6.0, 4.0, 6.0, 9.0, 15.0, 26.0, 49.0, 91.0, 144.0, 188.0, 152.0, 123.0, 67.0, 44.0, 25.0, 14.0, 10.0, 7.0, 7.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.95148468017578, -70.04188537597656, -64.13228607177734, -58.22269058227539, -52.31309509277344, -46.40349578857422, -40.493896484375, -34.58430099487305, -28.674701690673828, -22.765104293823242, -16.855506896972656, -10.945907592773438, -5.036310195922852, 0.8732872009277344, 6.782886505126953, 12.692481994628906, 18.602081298828125, 24.51167869567871, 30.421276092529297, 36.330875396728516, 42.24047088623047, 48.15007019042969, 54.059669494628906, 59.96926498413086, 65.87886047363281, 71.78845977783203, 77.69805908203125, 83.60765075683594, 89.51725006103516, 95.42684936523438, 101.3364486694336, 107.24604797363281, 113.15565490722656, 119.06525421142578, 124.974853515625, 130.8844451904297, 136.79405212402344, 142.70364379882812, 148.61325073242188, 154.52284240722656, 160.43243408203125, 166.34202575683594, 172.2516326904297, 178.16122436523438, 184.07083129882812, 189.9804229736328, 195.8900146484375, 201.79962158203125, 207.709228515625, 213.6188201904297, 219.52842712402344, 225.43801879882812, 231.34762573242188, 237.25721740722656, 243.16680908203125, 249.076416015625, 254.9860076904297, 260.8955993652344, 266.8052062988281, 272.7148132324219, 278.6243896484375, 284.53399658203125, 290.443603515625, 296.3531799316406, 302.2627868652344]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 6.0, 6.0, 14.0, 11.0, 15.0, 18.0, 33.0, 21.0, 31.0, 45.0, 30.0, 52.0, 44.0, 61.0, 51.0, 52.0, 34.0, 43.0, 55.0, 59.0, 37.0, 32.0, 34.0, 38.0, 29.0, 22.0, 24.0, 17.0, 19.0, 13.0, 7.0, 7.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-171.99749755859375, -167.3218231201172, -162.6461639404297, -157.97048950195312, -153.29481506347656, -148.619140625, -143.9434814453125, -139.26780700683594, -134.59213256835938, -129.9164581298828, -125.24079132080078, -120.56512451171875, -115.88945007324219, -111.21378326416016, -106.53811645507812, -101.86244201660156, -97.18678283691406, -92.51111602783203, -87.83544158935547, -83.15977478027344, -78.48410034179688, -73.80843353271484, -69.13276672363281, -64.45709228515625, -59.78142547607422, -55.10575485229492, -50.430084228515625, -45.754417419433594, -41.0787467956543, -36.403076171875, -31.727407455444336, -27.051738739013672, -22.376052856445312, -17.700382232666016, -13.024713516235352, -8.349043846130371, -3.6733741760253906, 1.0022964477539062, 5.67796516418457, 10.353633880615234, 15.029304504394531, 19.704975128173828, 24.380643844604492, 29.056312561035156, 33.73198318481445, 38.40765380859375, 43.08332061767578, 47.75899124145508, 52.434661865234375, 57.11033248901367, 61.78600311279297, 66.461669921875, 71.13734436035156, 75.8130111694336, 80.48867797851562, 85.16435241699219, 89.84001922607422, 94.51568603515625, 99.19136047363281, 103.86702728271484, 108.54269409179688, 113.21836853027344, 117.89403533935547, 122.5697021484375, 127.24537658691406]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 5.0, 10.0, 9.0, 15.0, 14.0, 14.0, 23.0, 36.0, 48.0, 45.0, 83.0, 134.0, 126.0, 217.0, 271.0, 329.0, 504.0, 709.0, 1110.0, 1040201.0, 1486.0, 913.0, 553.0, 414.0, 333.0, 252.0, 196.0, 131.0, 107.0, 68.0, 39.0, 44.0, 29.0, 21.0, 14.0, 14.0, 13.0, 14.0, 4.0, 1.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.27141571044922, -42.73384094238281, -41.19626235961914, -39.65868377685547, -38.12110900878906, -36.583534240722656, -35.045955657958984, -33.50837707519531, -31.970802307128906, -30.433225631713867, -28.895648956298828, -27.35807228088379, -25.82049560546875, -24.28291893005371, -22.745342254638672, -21.207765579223633, -19.670188903808594, -18.132612228393555, -16.595035552978516, -15.057458877563477, -13.519882202148438, -11.982305526733398, -10.44472885131836, -8.90715217590332, -7.369575500488281, -5.831998825073242, -4.294422149658203, -2.756845474243164, -1.219268798828125, 0.31830787658691406, 1.8558845520019531, 3.393461227416992, 4.931041717529297, 6.468618392944336, 8.006195068359375, 9.543771743774414, 11.081348419189453, 12.618925094604492, 14.156501770019531, 15.69407844543457, 17.23165512084961, 18.76923179626465, 20.306808471679688, 21.844385147094727, 23.381961822509766, 24.919538497924805, 26.457115173339844, 27.994691848754883, 29.532268524169922, 31.06984519958496, 32.607421875, 34.144996643066406, 35.68257522583008, 37.22015380859375, 38.757728576660156, 40.29530334472656, 41.832881927490234, 43.370460510253906, 44.90803527832031, 46.44561004638672, 47.98318862915039, 49.52076721191406, 51.05834197998047, 52.595916748046875, 54.13349533081055]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 10.0, 8.0, 11.0, 15.0, 14.0, 42.0, 129.0, 58874.0, 51404756.0, 70.0, 25.0, 17.0, 12.0, 13.0, 5.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4105.43603515625, -3963.91357421875, -3822.390869140625, -3680.868408203125, -3539.345703125, -3397.8232421875, -3256.30078125, -3114.7783203125, -2973.255615234375, -2831.733154296875, -2690.21044921875, -2548.68798828125, -2407.16552734375, -2265.642822265625, -2124.120361328125, -1982.5977783203125, -1841.0751953125, -1699.5526123046875, -1558.030029296875, -1416.507568359375, -1274.9849853515625, -1133.46240234375, -991.9398803710938, -850.4173583984375, -708.894775390625, -567.3721923828125, -425.84967041015625, -284.3271179199219, -142.8045654296875, -1.281982421875, 140.24053955078125, 281.7630615234375, 423.28515625, 564.8077392578125, 706.3302612304688, 847.852783203125, 989.3753662109375, 1130.89794921875, 1272.42041015625, 1413.9429931640625, 1555.465576171875, 1696.9881591796875, 1838.5107421875, 1980.033203125, 2121.5556640625, 2263.078369140625, 2404.600830078125, 2546.12353515625, 2687.64599609375, 2829.16845703125, 2970.691162109375, 3112.213623046875, 3253.736328125, 3395.2587890625, 3536.78125, 3678.3037109375, 3819.826416015625, 3961.348876953125, 4102.87158203125, 4244.39404296875, 4385.91650390625, 4527.439453125, 4668.9619140625, 4810.484375, 4952.0068359375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 3.0, 13.0, 14.0, 20.0, 30.0, 56.0, 69.0, 105.0, 173.0, 231.0, 335.0, 544.0, 744.0, 1151.0, 1702.0, 2766.0, 4484.0, 7494.0, 12205.0, 20552.0, 35215.0, 59953.0, 102384.0, 173379.0, 282466.0, 417777.0, 3201590.0, 959182.0, 382700.0, 251184.0, 152868.0, 90141.0, 52399.0, 30497.0, 18303.0, 10809.0, 6669.0, 4008.0, 2498.0, 1555.0, 1064.0, 716.0, 470.0, 303.0, 190.0, 136.0, 82.0, 57.0, 43.0, 33.0, 17.0, 24.0, 6.0, 8.0, 8.0, 4.0, 3.0], "bins": [-2.1875, -2.1229248046875, -2.058349609375, -1.9937744140625, -1.92919921875, -1.8646240234375, -1.800048828125, -1.7354736328125, -1.6708984375, -1.6063232421875, -1.541748046875, -1.4771728515625, -1.41259765625, -1.3480224609375, -1.283447265625, -1.2188720703125, -1.154296875, -1.0897216796875, -1.025146484375, -0.9605712890625, -0.89599609375, -0.8314208984375, -0.766845703125, -0.7022705078125, -0.6376953125, -0.5731201171875, -0.508544921875, -0.4439697265625, -0.37939453125, -0.3148193359375, -0.250244140625, -0.1856689453125, -0.12109375, -0.0565185546875, 0.008056640625, 0.0726318359375, 0.13720703125, 0.2017822265625, 0.266357421875, 0.3309326171875, 0.3955078125, 0.4600830078125, 0.524658203125, 0.5892333984375, 0.65380859375, 0.7183837890625, 0.782958984375, 0.8475341796875, 0.912109375, 0.9766845703125, 1.041259765625, 1.1058349609375, 1.17041015625, 1.2349853515625, 1.299560546875, 1.3641357421875, 1.4287109375, 1.4932861328125, 1.557861328125, 1.6224365234375, 1.68701171875, 1.7515869140625, 1.816162109375, 1.8807373046875, 1.9453125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 7.0, 9.0, 6.0, 11.0, 9.0, 16.0, 19.0, 12.0, 13.0, 20.0, 25.0, 30.0, 37.0, 32.0, 30.0, 29.0, 37.0, 45.0, 37.0, 79.0, 872.0, 185.0, 40.0, 40.0, 44.0, 40.0, 40.0, 30.0, 23.0, 34.0, 22.0, 30.0, 27.0, 22.0, 15.0, 14.0, 12.0, 6.0, 4.0, 2.0, 7.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.890625, -15.418212890625, -14.94580078125, -14.473388671875, -14.0009765625, -13.528564453125, -13.05615234375, -12.583740234375, -12.111328125, -11.638916015625, -11.16650390625, -10.694091796875, -10.2216796875, -9.749267578125, -9.27685546875, -8.804443359375, -8.33203125, -7.859619140625, -7.38720703125, -6.914794921875, -6.4423828125, -5.969970703125, -5.49755859375, -5.025146484375, -4.552734375, -4.080322265625, -3.60791015625, -3.135498046875, -2.6630859375, -2.190673828125, -1.71826171875, -1.245849609375, -0.7734375, -0.301025390625, 0.17138671875, 0.643798828125, 1.1162109375, 1.588623046875, 2.06103515625, 2.533447265625, 3.005859375, 3.478271484375, 3.95068359375, 4.423095703125, 4.8955078125, 5.367919921875, 5.84033203125, 6.312744140625, 6.78515625, 7.257568359375, 7.72998046875, 8.202392578125, 8.6748046875, 9.147216796875, 9.61962890625, 10.092041015625, 10.564453125, 11.036865234375, 11.50927734375, 11.981689453125, 12.4541015625, 12.926513671875, 13.39892578125, 13.871337890625, 14.34375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 7.0, 4.0, 10.0, 19.0, 19.0, 29.0, 52.0, 98.0, 113.0, 157.0, 244.0, 329.0, 511.0, 728.0, 1161.0, 1728.0, 2584.0, 4076.0, 6352.0, 9838.0, 15993.0, 25672.0, 42560.0, 70405.0, 120168.0, 204843.0, 336487.0, 542774.0, 3613514.0, 497772.0, 317424.0, 191038.0, 112566.0, 66535.0, 39693.0, 24000.0, 15111.0, 9401.0, 5972.0, 3994.0, 2528.0, 1678.0, 1114.0, 734.0, 449.0, 315.0, 223.0, 143.0, 84.0, 56.0, 45.0, 33.0, 21.0, 18.0, 12.0, 4.0, 5.0, 3.0, 0.0, 4.0, 1.0], "bins": [-2.240234375, -2.168975830078125, -2.09771728515625, -2.026458740234375, -1.9552001953125, -1.883941650390625, -1.81268310546875, -1.741424560546875, -1.670166015625, -1.598907470703125, -1.52764892578125, -1.456390380859375, -1.3851318359375, -1.313873291015625, -1.24261474609375, -1.171356201171875, -1.10009765625, -1.028839111328125, -0.95758056640625, -0.886322021484375, -0.8150634765625, -0.743804931640625, -0.67254638671875, -0.601287841796875, -0.530029296875, -0.458770751953125, -0.38751220703125, -0.316253662109375, -0.2449951171875, -0.173736572265625, -0.10247802734375, -0.031219482421875, 0.0400390625, 0.111297607421875, 0.18255615234375, 0.253814697265625, 0.3250732421875, 0.396331787109375, 0.46759033203125, 0.538848876953125, 0.610107421875, 0.681365966796875, 0.75262451171875, 0.823883056640625, 0.8951416015625, 0.966400146484375, 1.03765869140625, 1.108917236328125, 1.18017578125, 1.251434326171875, 1.32269287109375, 1.393951416015625, 1.4652099609375, 1.536468505859375, 1.60772705078125, 1.678985595703125, 1.750244140625, 1.821502685546875, 1.89276123046875, 1.964019775390625, 2.0352783203125, 2.106536865234375, 2.17779541015625, 2.249053955078125, 2.3203125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 1.0, 6.0, 4.0, 3.0, 6.0, 6.0, 10.0, 7.0, 8.0, 14.0, 19.0, 14.0, 14.0, 15.0, 28.0, 28.0, 31.0, 25.0, 32.0, 33.0, 38.0, 37.0, 27.0, 44.0, 161.0, 827.0, 141.0, 39.0, 32.0, 33.0, 47.0, 39.0, 32.0, 23.0, 27.0, 23.0, 29.0, 18.0, 15.0, 19.0, 15.0, 11.0, 9.0, 11.0, 6.0, 4.0, 3.0, 3.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.671875, -8.3671875, -8.0625, -7.7578125, -7.453125, -7.1484375, -6.84375, -6.5390625, -6.234375, -5.9296875, -5.625, -5.3203125, -5.015625, -4.7109375, -4.40625, -4.1015625, -3.796875, -3.4921875, -3.1875, -2.8828125, -2.578125, -2.2734375, -1.96875, -1.6640625, -1.359375, -1.0546875, -0.75, -0.4453125, -0.140625, 0.1640625, 0.46875, 0.7734375, 1.078125, 1.3828125, 1.6875, 1.9921875, 2.296875, 2.6015625, 2.90625, 3.2109375, 3.515625, 3.8203125, 4.125, 4.4296875, 4.734375, 5.0390625, 5.34375, 5.6484375, 5.953125, 6.2578125, 6.5625, 6.8671875, 7.171875, 7.4765625, 7.78125, 8.0859375, 8.390625, 8.6953125, 9.0, 9.3046875, 9.609375, 9.9140625, 10.21875, 10.5234375, 10.828125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 5.0, 6.0, 9.0, 6.0, 15.0, 20.0, 24.0, 31.0, 33.0, 48.0, 65.0, 89.0, 123.0, 160.0, 187.0, 243.0, 310.0, 455.0, 593.0, 852.0, 1275.0, 1760.0, 2953.0, 5090.0, 9493.0, 20386.0, 54960.0, 196961.0, 5797082.0, 123578.0, 38938.0, 15736.0, 7590.0, 4266.0, 2488.0, 1623.0, 1081.0, 704.0, 514.0, 411.0, 306.0, 225.0, 155.0, 157.0, 94.0, 86.0, 58.0, 52.0, 28.0, 28.0, 18.0, 11.0, 18.0, 9.0, 9.0, 9.0, 9.0, 5.0, 5.0, 3.0], "bins": [-9.6640625, -9.365234375, -9.06640625, -8.767578125, -8.46875, -8.169921875, -7.87109375, -7.572265625, -7.2734375, -6.974609375, -6.67578125, -6.376953125, -6.078125, -5.779296875, -5.48046875, -5.181640625, -4.8828125, -4.583984375, -4.28515625, -3.986328125, -3.6875, -3.388671875, -3.08984375, -2.791015625, -2.4921875, -2.193359375, -1.89453125, -1.595703125, -1.296875, -0.998046875, -0.69921875, -0.400390625, -0.1015625, 0.197265625, 0.49609375, 0.794921875, 1.09375, 1.392578125, 1.69140625, 1.990234375, 2.2890625, 2.587890625, 2.88671875, 3.185546875, 3.484375, 3.783203125, 4.08203125, 4.380859375, 4.6796875, 4.978515625, 5.27734375, 5.576171875, 5.875, 6.173828125, 6.47265625, 6.771484375, 7.0703125, 7.369140625, 7.66796875, 7.966796875, 8.265625, 8.564453125, 8.86328125, 9.162109375, 9.4609375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 4.0, 3.0, 6.0, 11.0, 8.0, 9.0, 15.0, 20.0, 14.0, 31.0, 34.0, 28.0, 42.0, 37.0, 37.0, 36.0, 49.0, 48.0, 153.0, 710.0, 245.0, 57.0, 62.0, 35.0, 48.0, 43.0, 40.0, 37.0, 26.0, 17.0, 25.0, 17.0, 23.0, 10.0, 9.0, 9.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-9.34375, -9.08819580078125, -8.8326416015625, -8.57708740234375, -8.321533203125, -8.06597900390625, -7.8104248046875, -7.55487060546875, -7.29931640625, -7.04376220703125, -6.7882080078125, -6.53265380859375, -6.277099609375, -6.02154541015625, -5.7659912109375, -5.51043701171875, -5.2548828125, -4.99932861328125, -4.7437744140625, -4.48822021484375, -4.232666015625, -3.97711181640625, -3.7215576171875, -3.46600341796875, -3.21044921875, -2.95489501953125, -2.6993408203125, -2.44378662109375, -2.188232421875, -1.93267822265625, -1.6771240234375, -1.42156982421875, -1.166015625, -0.91046142578125, -0.6549072265625, -0.39935302734375, -0.143798828125, 0.11175537109375, 0.3673095703125, 0.62286376953125, 0.87841796875, 1.13397216796875, 1.3895263671875, 1.64508056640625, 1.900634765625, 2.15618896484375, 2.4117431640625, 2.66729736328125, 2.9228515625, 3.17840576171875, 3.4339599609375, 3.68951416015625, 3.945068359375, 4.20062255859375, 4.4561767578125, 4.71173095703125, 4.96728515625, 5.22283935546875, 5.4783935546875, 5.73394775390625, 5.989501953125, 6.24505615234375, 6.5006103515625, 6.75616455078125, 7.01171875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 23.0, 72.0, 205.0, 383.0, 217.0, 66.0, 22.0, 9.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.21373748779297, -21.60333824157715, -19.992938995361328, -18.382539749145508, -16.772140502929688, -15.161742210388184, -13.551342964172363, -11.940943717956543, -10.330544471740723, -8.720145225524902, -7.109745979309082, -5.49934720993042, -3.8889479637145996, -2.2785491943359375, -0.6681499481201172, 0.9422492980957031, 2.5526485443115234, 4.163047790527344, 5.773447036743164, 7.383845806121826, 8.994245529174805, 10.604643821716309, 12.215043067932129, 13.82544231414795, 15.43584156036377, 17.046239852905273, 18.656639099121094, 20.267038345336914, 21.877437591552734, 23.487836837768555, 25.098236083984375, 26.708635330200195, 28.319034576416016, 29.929433822631836, 31.539833068847656, 33.150230407714844, 34.7606315612793, 36.371028900146484, 37.98143005371094, 39.591827392578125, 41.20222854614258, 42.812625885009766, 44.42302703857422, 46.033424377441406, 47.64382553100586, 49.25422286987305, 50.8646240234375, 52.47502136230469, 54.085418701171875, 55.69581604003906, 57.306217193603516, 58.9166145324707, 60.527015686035156, 62.137413024902344, 63.7478141784668, 65.35821533203125, 66.96861267089844, 68.57901000976562, 70.18940734863281, 71.79981231689453, 73.41020965576172, 75.0206069946289, 76.6310043334961, 78.24140930175781, 79.851806640625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 2.0, 6.0, 7.0, 10.0, 8.0, 14.0, 14.0, 9.0, 17.0, 17.0, 27.0, 42.0, 33.0, 36.0, 28.0, 51.0, 47.0, 41.0, 37.0, 44.0, 40.0, 33.0, 46.0, 48.0, 46.0, 37.0, 32.0, 34.0, 27.0, 27.0, 20.0, 20.0, 20.0, 13.0, 16.0, 8.0, 13.0, 7.0, 8.0, 3.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.829414367675781, -11.450998306274414, -11.072583198547363, -10.694167137145996, -10.315752029418945, -9.937335968017578, -9.558919906616211, -9.180503845214844, -8.802088737487793, -8.423672676086426, -8.045257568359375, -7.666841506958008, -7.288425922393799, -6.91001033782959, -6.531594276428223, -6.153178691864014, -5.774763107299805, -5.396347522735596, -5.017931938171387, -4.6395158767700195, -4.2611002922058105, -3.8826847076416016, -3.5042688846588135, -3.1258530616760254, -2.7474374771118164, -2.3690218925476074, -1.9906060695648193, -1.6121903657913208, -1.2337746620178223, -0.8553589582443237, -0.4769432544708252, -0.09852743148803711, 0.2798891067504883, 0.6583048105239868, 1.0367205142974854, 1.4151362180709839, 1.7935519218444824, 2.1719675064086914, 2.5503833293914795, 2.9287991523742676, 3.3072147369384766, 3.6856303215026855, 4.0640459060668945, 4.442461967468262, 4.820877552032471, 5.19929313659668, 5.577709197998047, 5.956124782562256, 6.334540367126465, 6.712955951690674, 7.091371536254883, 7.46978759765625, 7.848203182220459, 8.226618766784668, 8.605034828186035, 8.983449935913086, 9.361865997314453, 9.74028205871582, 10.118697166442871, 10.497113227844238, 10.875528335571289, 11.253944396972656, 11.632360458374023, 12.01077651977539, 12.389191627502441]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 6.0, 6.0, 14.0, 26.0, 35.0, 50.0, 61.0, 122.0, 206.0, 330.0, 634.0, 1225.0, 2515.0, 5730.0, 15573.0, 63216.0, 3936408.0, 130129.0, 22840.0, 7788.0, 3426.0, 1660.0, 917.0, 488.0, 306.0, 179.0, 115.0, 74.0, 64.0, 33.0, 26.0, 26.0, 14.0, 13.0, 9.0, 7.0, 1.0, 1.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51025390625, -0.49111175537109375, -0.4719696044921875, -0.45282745361328125, -0.433685302734375, -0.41454315185546875, -0.3954010009765625, -0.37625885009765625, -0.35711669921875, -0.33797454833984375, -0.3188323974609375, -0.29969024658203125, -0.280548095703125, -0.26140594482421875, -0.2422637939453125, -0.22312164306640625, -0.2039794921875, -0.18483734130859375, -0.1656951904296875, -0.14655303955078125, -0.127410888671875, -0.10826873779296875, -0.0891265869140625, -0.06998443603515625, -0.05084228515625, -0.03170013427734375, -0.0125579833984375, 0.00658416748046875, 0.025726318359375, 0.04486846923828125, 0.0640106201171875, 0.08315277099609375, 0.102294921875, 0.12143707275390625, 0.1405792236328125, 0.15972137451171875, 0.178863525390625, 0.19800567626953125, 0.2171478271484375, 0.23628997802734375, 0.25543212890625, 0.27457427978515625, 0.2937164306640625, 0.31285858154296875, 0.332000732421875, 0.35114288330078125, 0.3702850341796875, 0.38942718505859375, 0.4085693359375, 0.42771148681640625, 0.4468536376953125, 0.46599578857421875, 0.485137939453125, 0.5042800903320312, 0.5234222412109375, 0.5425643920898438, 0.56170654296875, 0.5808486938476562, 0.5999908447265625, 0.6191329956054688, 0.638275146484375, 0.6574172973632812, 0.6765594482421875, 0.6957015991210938, 0.71484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 7.0, 2.0, 4.0, 3.0, 6.0, 8.0, 5.0, 9.0, 14.0, 15.0, 11.0, 76.0, 719.0, 14.0, 11.0, 15.0, 9.0, 12.0, 7.0, 8.0, 5.0, 5.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059906005859375, -0.05779600143432617, -0.055685997009277344, -0.053575992584228516, -0.05146598815917969, -0.04935598373413086, -0.04724597930908203, -0.0451359748840332, -0.043025970458984375, -0.04091596603393555, -0.03880596160888672, -0.03669595718383789, -0.03458595275878906, -0.032475948333740234, -0.030365943908691406, -0.028255939483642578, -0.02614593505859375, -0.024035930633544922, -0.021925926208496094, -0.019815921783447266, -0.017705917358398438, -0.01559591293334961, -0.013485908508300781, -0.011375904083251953, -0.009265899658203125, -0.007155895233154297, -0.005045890808105469, -0.0029358863830566406, -0.0008258819580078125, 0.0012841224670410156, 0.0033941268920898438, 0.005504131317138672, 0.0076141357421875, 0.009724140167236328, 0.011834144592285156, 0.013944149017333984, 0.016054153442382812, 0.01816415786743164, 0.02027416229248047, 0.022384166717529297, 0.024494171142578125, 0.026604175567626953, 0.02871417999267578, 0.03082418441772461, 0.03293418884277344, 0.035044193267822266, 0.037154197692871094, 0.03926420211791992, 0.04137420654296875, 0.04348421096801758, 0.045594215393066406, 0.047704219818115234, 0.04981422424316406, 0.05192422866821289, 0.05403423309326172, 0.05614423751831055, 0.058254241943359375, 0.0603642463684082, 0.06247425079345703, 0.06458425521850586, 0.06669425964355469, 0.06880426406860352, 0.07091426849365234, 0.07302427291870117, 0.07513427734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 8.0, 19.0, 13.0, 9.0, 22.0, 31.0, 43.0, 63.0, 137.0, 170.0, 308.0, 560.0, 1139.0, 2196.0, 4527.0, 9845.0, 25172.0, 74534.0, 287590.0, 2227527.0, 1267205.0, 199568.0, 56823.0, 20116.0, 8531.0, 3898.0, 1941.0, 969.0, 533.0, 268.0, 174.0, 116.0, 59.0, 39.0, 38.0, 25.0, 20.0, 10.0, 7.0, 7.0, 5.0, 2.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.314697265625, -0.3048248291015625, -0.294952392578125, -0.2850799560546875, -0.27520751953125, -0.2653350830078125, -0.255462646484375, -0.2455902099609375, -0.2357177734375, -0.2258453369140625, -0.215972900390625, -0.2061004638671875, -0.19622802734375, -0.1863555908203125, -0.176483154296875, -0.1666107177734375, -0.15673828125, -0.1468658447265625, -0.136993408203125, -0.1271209716796875, -0.11724853515625, -0.1073760986328125, -0.097503662109375, -0.0876312255859375, -0.0777587890625, -0.0678863525390625, -0.058013916015625, -0.0481414794921875, -0.03826904296875, -0.0283966064453125, -0.018524169921875, -0.0086517333984375, 0.001220703125, 0.0110931396484375, 0.020965576171875, 0.0308380126953125, 0.04071044921875, 0.0505828857421875, 0.060455322265625, 0.0703277587890625, 0.0802001953125, 0.0900726318359375, 0.099945068359375, 0.1098175048828125, 0.11968994140625, 0.1295623779296875, 0.139434814453125, 0.1493072509765625, 0.1591796875, 0.1690521240234375, 0.178924560546875, 0.1887969970703125, 0.19866943359375, 0.2085418701171875, 0.218414306640625, 0.2282867431640625, 0.2381591796875, 0.2480316162109375, 0.257904052734375, 0.2677764892578125, 0.27764892578125, 0.2875213623046875, 0.297393798828125, 0.3072662353515625, 0.317138671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 7.0, 3.0, 7.0, 11.0, 13.0, 9.0, 21.0, 27.0, 37.0, 65.0, 60.0, 105.0, 136.0, 206.0, 284.0, 501.0, 866.0, 586.0, 367.0, 211.0, 132.0, 107.0, 107.0, 41.0, 38.0, 25.0, 25.0, 17.0, 14.0, 12.0, 8.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.138427734375, -0.13474464416503906, -0.13106155395507812, -0.1273784637451172, -0.12369537353515625, -0.12001228332519531, -0.11632919311523438, -0.11264610290527344, -0.1089630126953125, -0.10527992248535156, -0.10159683227539062, -0.09791374206542969, -0.09423065185546875, -0.09054756164550781, -0.08686447143554688, -0.08318138122558594, -0.079498291015625, -0.07581520080566406, -0.07213211059570312, -0.06844902038574219, -0.06476593017578125, -0.06108283996582031, -0.057399749755859375, -0.05371665954589844, -0.0500335693359375, -0.04635047912597656, -0.042667388916015625, -0.03898429870605469, -0.03530120849609375, -0.03161811828613281, -0.027935028076171875, -0.024251937866210938, -0.02056884765625, -0.016885757446289062, -0.013202667236328125, -0.009519577026367188, -0.00583648681640625, -0.0021533966064453125, 0.001529693603515625, 0.0052127838134765625, 0.0088958740234375, 0.012578964233398438, 0.016262054443359375, 0.019945144653320312, 0.02362823486328125, 0.027311325073242188, 0.030994415283203125, 0.03467750549316406, 0.038360595703125, 0.04204368591308594, 0.045726776123046875, 0.04940986633300781, 0.05309295654296875, 0.05677604675292969, 0.060459136962890625, 0.06414222717285156, 0.0678253173828125, 0.07150840759277344, 0.07519149780273438, 0.07887458801269531, 0.08255767822265625, 0.08624076843261719, 0.08992385864257812, 0.09360694885253906, 0.0972900390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 8.0, 11.0, 21.0, 56.0, 74.0, 134.0, 160.0, 157.0, 145.0, 90.0, 58.0, 33.0, 12.0, 12.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5847426652908325, -0.5522713661193848, -0.519800066947937, -0.48732873797416687, -0.4548574388027191, -0.42238613963127136, -0.3899148106575012, -0.35744351148605347, -0.3249722123146057, -0.29250091314315796, -0.2600296139717102, -0.22755828499794006, -0.1950869858264923, -0.16261568665504456, -0.1301443725824356, -0.09767305850982666, -0.0652017593383789, -0.032730452716350555, -0.0002591460943222046, 0.032212160527706146, 0.0646834671497345, 0.09715476632118225, 0.1296260803937912, 0.16209739446640015, 0.1945686936378479, 0.22703999280929565, 0.2595112919807434, 0.29198262095451355, 0.3244539201259613, 0.35692521929740906, 0.3893965482711792, 0.42186784744262695, 0.45433902740478516, 0.4868103265762329, 0.5192816257476807, 0.5517529249191284, 0.5842242240905762, 0.6166955232620239, 0.6491668820381165, 0.6816381812095642, 0.714109480381012, 0.7465807795524597, 0.7790520787239075, 0.8115233778953552, 0.8439947366714478, 0.8764660358428955, 0.9089373350143433, 0.941408634185791, 0.9738799333572388, 1.0063512325286865, 1.0388225317001343, 1.071293830871582, 1.1037651300430298, 1.1362364292144775, 1.1687077283859253, 1.201179027557373, 1.2336504459381104, 1.266121745109558, 1.2985930442810059, 1.3310643434524536, 1.3635356426239014, 1.3960069417953491, 1.4284782409667969, 1.4609496593475342, 1.4934208393096924]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 8.0, 7.0, 12.0, 16.0, 22.0, 24.0, 48.0, 43.0, 54.0, 58.0, 66.0, 64.0, 58.0, 69.0, 58.0, 65.0, 55.0, 45.0, 50.0, 45.0, 35.0, 19.0, 15.0, 12.0, 12.0, 7.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6479199528694153, -0.6287246346473694, -0.6095293164253235, -0.5903339982032776, -0.5711386799812317, -0.5519433617591858, -0.5327480435371399, -0.5135527849197388, -0.4943574368953705, -0.4751621186733246, -0.4559668004512787, -0.4367714822292328, -0.4175761938095093, -0.3983808755874634, -0.3791855573654175, -0.3599902391433716, -0.3407949209213257, -0.3215996026992798, -0.3024042844772339, -0.283208966255188, -0.2640136480331421, -0.24481834471225739, -0.22562304139137268, -0.20642772316932678, -0.18723240494728088, -0.16803708672523499, -0.1488417685031891, -0.12964646518230438, -0.11045114696025848, -0.09125582873821259, -0.07206051796674728, -0.05286520719528198, -0.033669888973236084, -0.014474574476480484, 0.004720740020275116, 0.023916054517030716, 0.043111369013786316, 0.062306687235832214, 0.08150199800729752, 0.10069730877876282, 0.11989262700080872, 0.13908794522285461, 0.1582832634449005, 0.17747856676578522, 0.19667388498783112, 0.21586920320987701, 0.23506450653076172, 0.2542598247528076, 0.2734551429748535, 0.2926504611968994, 0.3118457794189453, 0.3310410976409912, 0.3502364158630371, 0.369431734085083, 0.3886270225048065, 0.4078223407268524, 0.4270176589488983, 0.4462129771709442, 0.4654082953929901, 0.484603613615036, 0.5037989020347595, 0.5229942202568054, 0.5421895384788513, 0.5613848567008972, 0.5805801749229431]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 3.0, 10.0, 20.0, 32.0, 36.0, 50.0, 78.0, 116.0, 170.0, 231.0, 396.0, 549.0, 892.0, 1339.0, 2325.0, 3405.0, 5680.0, 9469.0, 16380.0, 32045.0, 393414.0, 504835.0, 34300.0, 17039.0, 9819.0, 5926.0, 3606.0, 2193.0, 1440.0, 957.0, 611.0, 395.0, 253.0, 181.0, 113.0, 67.0, 46.0, 37.0, 31.0, 22.0, 11.0, 10.0, 7.0, 7.0, 2.0, 1.0, 5.0], "bins": [-0.47998046875, -0.4673614501953125, -0.454742431640625, -0.4421234130859375, -0.42950439453125, -0.4168853759765625, -0.404266357421875, -0.3916473388671875, -0.3790283203125, -0.3664093017578125, -0.353790283203125, -0.3411712646484375, -0.32855224609375, -0.3159332275390625, -0.303314208984375, -0.2906951904296875, -0.278076171875, -0.2654571533203125, -0.252838134765625, -0.2402191162109375, -0.22760009765625, -0.2149810791015625, -0.202362060546875, -0.1897430419921875, -0.1771240234375, -0.1645050048828125, -0.151885986328125, -0.1392669677734375, -0.12664794921875, -0.1140289306640625, -0.101409912109375, -0.0887908935546875, -0.076171875, -0.0635528564453125, -0.050933837890625, -0.0383148193359375, -0.02569580078125, -0.0130767822265625, -0.000457763671875, 0.0121612548828125, 0.0247802734375, 0.0373992919921875, 0.050018310546875, 0.0626373291015625, 0.07525634765625, 0.0878753662109375, 0.100494384765625, 0.1131134033203125, 0.125732421875, 0.1383514404296875, 0.150970458984375, 0.1635894775390625, 0.17620849609375, 0.1888275146484375, 0.201446533203125, 0.2140655517578125, 0.2266845703125, 0.2393035888671875, 0.251922607421875, 0.2645416259765625, 0.27716064453125, 0.2897796630859375, 0.302398681640625, 0.3150177001953125, 0.32763671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 3.0, 3.0, 3.0, 6.0, 7.0, 8.0, 8.0, 10.0, 18.0, 36.0, 86.0, 242.0, 273.0, 156.0, 43.0, 17.0, 11.0, 11.0, 5.0, 6.0, 7.0, 2.0, 5.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05657958984375, -0.054511070251464844, -0.05244255065917969, -0.05037403106689453, -0.048305511474609375, -0.04623699188232422, -0.04416847229003906, -0.042099952697753906, -0.04003143310546875, -0.037962913513183594, -0.03589439392089844, -0.03382587432861328, -0.031757354736328125, -0.02968883514404297, -0.027620315551757812, -0.025551795959472656, -0.0234832763671875, -0.021414756774902344, -0.019346237182617188, -0.01727771759033203, -0.015209197998046875, -0.013140678405761719, -0.011072158813476562, -0.009003639221191406, -0.00693511962890625, -0.004866600036621094, -0.0027980804443359375, -0.0007295608520507812, 0.001338958740234375, 0.0034074783325195312, 0.0054759979248046875, 0.007544517517089844, 0.009613037109375, 0.011681556701660156, 0.013750076293945312, 0.01581859588623047, 0.017887115478515625, 0.01995563507080078, 0.022024154663085938, 0.024092674255371094, 0.02616119384765625, 0.028229713439941406, 0.030298233032226562, 0.03236675262451172, 0.034435272216796875, 0.03650379180908203, 0.03857231140136719, 0.040640830993652344, 0.0427093505859375, 0.044777870178222656, 0.04684638977050781, 0.04891490936279297, 0.050983428955078125, 0.05305194854736328, 0.05512046813964844, 0.057188987731933594, 0.05925750732421875, 0.061326026916503906, 0.06339454650878906, 0.06546306610107422, 0.06753158569335938, 0.06960010528564453, 0.07166862487792969, 0.07373714447021484, 0.0758056640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 3.0, 4.0, 10.0, 13.0, 15.0, 19.0, 30.0, 42.0, 61.0, 74.0, 110.0, 172.0, 207.0, 438.0, 692.0, 1354.0, 2852.0, 7290.0, 22240.0, 86954.0, 358226.0, 419511.0, 106588.0, 26522.0, 8336.0, 3242.0, 1497.0, 750.0, 433.0, 266.0, 167.0, 115.0, 82.0, 67.0, 45.0, 32.0, 26.0, 16.0, 12.0, 8.0, 11.0, 6.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.434814453125, -0.4198570251464844, -0.40489959716796875, -0.3899421691894531, -0.3749847412109375, -0.3600273132324219, -0.34506988525390625, -0.3301124572753906, -0.315155029296875, -0.3001976013183594, -0.28524017333984375, -0.2702827453613281, -0.2553253173828125, -0.24036788940429688, -0.22541046142578125, -0.21045303344726562, -0.19549560546875, -0.18053817749023438, -0.16558074951171875, -0.15062332153320312, -0.1356658935546875, -0.12070846557617188, -0.10575103759765625, -0.09079360961914062, -0.075836181640625, -0.060878753662109375, -0.04592132568359375, -0.030963897705078125, -0.0160064697265625, -0.001049041748046875, 0.01390838623046875, 0.028865814208984375, 0.0438232421875, 0.058780670166015625, 0.07373809814453125, 0.08869552612304688, 0.1036529541015625, 0.11861038208007812, 0.13356781005859375, 0.14852523803710938, 0.163482666015625, 0.17844009399414062, 0.19339752197265625, 0.20835494995117188, 0.2233123779296875, 0.23826980590820312, 0.25322723388671875, 0.2681846618652344, 0.28314208984375, 0.2980995178222656, 0.31305694580078125, 0.3280143737792969, 0.3429718017578125, 0.3579292297363281, 0.37288665771484375, 0.3878440856933594, 0.402801513671875, 0.4177589416503906, 0.43271636962890625, 0.4476737976074219, 0.4626312255859375, 0.4775886535644531, 0.49254608154296875, 0.5075035095214844, 0.5224609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 6.0, 9.0, 8.0, 8.0, 15.0, 18.0, 17.0, 20.0, 19.0, 27.0, 33.0, 28.0, 41.0, 40.0, 43.0, 45.0, 41.0, 45.0, 41.0, 38.0, 45.0, 34.0, 45.0, 45.0, 33.0, 35.0, 30.0, 26.0, 24.0, 20.0, 17.0, 19.0, 17.0, 14.0, 14.0, 14.0, 5.0, 3.0, 3.0, 3.0, 8.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.29541015625, -0.28730010986328125, -0.2791900634765625, -0.27108001708984375, -0.262969970703125, -0.25485992431640625, -0.2467498779296875, -0.23863983154296875, -0.23052978515625, -0.22241973876953125, -0.2143096923828125, -0.20619964599609375, -0.198089599609375, -0.18997955322265625, -0.1818695068359375, -0.17375946044921875, -0.1656494140625, -0.15753936767578125, -0.1494293212890625, -0.14131927490234375, -0.133209228515625, -0.12509918212890625, -0.1169891357421875, -0.10887908935546875, -0.10076904296875, -0.09265899658203125, -0.0845489501953125, -0.07643890380859375, -0.068328857421875, -0.06021881103515625, -0.0521087646484375, -0.04399871826171875, -0.035888671875, -0.02777862548828125, -0.0196685791015625, -0.01155853271484375, -0.003448486328125, 0.00466156005859375, 0.0127716064453125, 0.02088165283203125, 0.02899169921875, 0.03710174560546875, 0.0452117919921875, 0.05332183837890625, 0.061431884765625, 0.06954193115234375, 0.0776519775390625, 0.08576202392578125, 0.0938720703125, 0.10198211669921875, 0.1100921630859375, 0.11820220947265625, 0.126312255859375, 0.13442230224609375, 0.1425323486328125, 0.15064239501953125, 0.15875244140625, 0.16686248779296875, 0.1749725341796875, 0.18308258056640625, 0.191192626953125, 0.19930267333984375, 0.2074127197265625, 0.21552276611328125, 0.2236328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 9.0, 15.0, 23.0, 41.0, 62.0, 88.0, 173.0, 395.0, 869.0, 2711.0, 12907.0, 393653.0, 616950.0, 15857.0, 2970.0, 967.0, 382.0, 196.0, 110.0, 49.0, 32.0, 14.0, 20.0, 21.0, 7.0, 8.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97314453125, -0.942779541015625, -0.91241455078125, -0.882049560546875, -0.8516845703125, -0.821319580078125, -0.79095458984375, -0.760589599609375, -0.730224609375, -0.699859619140625, -0.66949462890625, -0.639129638671875, -0.6087646484375, -0.578399658203125, -0.54803466796875, -0.517669677734375, -0.4873046875, -0.456939697265625, -0.42657470703125, -0.396209716796875, -0.3658447265625, -0.335479736328125, -0.30511474609375, -0.274749755859375, -0.244384765625, -0.214019775390625, -0.18365478515625, -0.153289794921875, -0.1229248046875, -0.092559814453125, -0.06219482421875, -0.031829833984375, -0.00146484375, 0.028900146484375, 0.05926513671875, 0.089630126953125, 0.1199951171875, 0.150360107421875, 0.18072509765625, 0.211090087890625, 0.241455078125, 0.271820068359375, 0.30218505859375, 0.332550048828125, 0.3629150390625, 0.393280029296875, 0.42364501953125, 0.454010009765625, 0.484375, 0.514739990234375, 0.54510498046875, 0.575469970703125, 0.6058349609375, 0.636199951171875, 0.66656494140625, 0.696929931640625, 0.727294921875, 0.757659912109375, 0.78802490234375, 0.818389892578125, 0.8487548828125, 0.879119873046875, 0.90948486328125, 0.939849853515625, 0.97021484375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 7.0, 10.0, 18.0, 31.0, 49.0, 65.0, 90.0, 121.0, 123.0, 119.0, 108.0, 78.0, 58.0, 40.0, 29.0, 16.0, 12.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.21540641784668e-05, -5.070120096206665e-05, -4.9248337745666504e-05, -4.779547452926636e-05, -4.634261131286621e-05, -4.4889748096466064e-05, -4.343688488006592e-05, -4.198402166366577e-05, -4.0531158447265625e-05, -3.907829523086548e-05, -3.762543201446533e-05, -3.6172568798065186e-05, -3.471970558166504e-05, -3.326684236526489e-05, -3.1813979148864746e-05, -3.03611159324646e-05, -2.8908252716064453e-05, -2.7455389499664307e-05, -2.600252628326416e-05, -2.4549663066864014e-05, -2.3096799850463867e-05, -2.164393663406372e-05, -2.0191073417663574e-05, -1.8738210201263428e-05, -1.728534698486328e-05, -1.5832483768463135e-05, -1.4379620552062988e-05, -1.2926757335662842e-05, -1.1473894119262695e-05, -1.0021030902862549e-05, -8.568167686462402e-06, -7.115304470062256e-06, -5.662441253662109e-06, -4.209578037261963e-06, -2.7567148208618164e-06, -1.30385160446167e-06, 1.4901161193847656e-07, 1.601874828338623e-06, 3.0547380447387695e-06, 4.507601261138916e-06, 5.9604644775390625e-06, 7.413327693939209e-06, 8.866190910339355e-06, 1.0319054126739502e-05, 1.1771917343139648e-05, 1.3224780559539795e-05, 1.4677643775939941e-05, 1.6130506992340088e-05, 1.7583370208740234e-05, 1.903623342514038e-05, 2.0489096641540527e-05, 2.1941959857940674e-05, 2.339482307434082e-05, 2.4847686290740967e-05, 2.6300549507141113e-05, 2.775341272354126e-05, 2.9206275939941406e-05, 3.065913915634155e-05, 3.21120023727417e-05, 3.3564865589141846e-05, 3.501772880554199e-05, 3.647059202194214e-05, 3.7923455238342285e-05, 3.937631845474243e-05, 4.082918167114258e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 9.0, 2.0, 10.0, 10.0, 19.0, 34.0, 72.0, 123.0, 255.0, 674.0, 1686.0, 5718.0, 25476.0, 199966.0, 681319.0, 110207.0, 16544.0, 4109.0, 1329.0, 543.0, 218.0, 93.0, 55.0, 38.0, 22.0, 10.0, 7.0, 2.0, 0.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.61474609375, -0.598724365234375, -0.58270263671875, -0.566680908203125, -0.5506591796875, -0.534637451171875, -0.51861572265625, -0.502593994140625, -0.486572265625, -0.470550537109375, -0.45452880859375, -0.438507080078125, -0.4224853515625, -0.406463623046875, -0.39044189453125, -0.374420166015625, -0.3583984375, -0.342376708984375, -0.32635498046875, -0.310333251953125, -0.2943115234375, -0.278289794921875, -0.26226806640625, -0.246246337890625, -0.230224609375, -0.214202880859375, -0.19818115234375, -0.182159423828125, -0.1661376953125, -0.150115966796875, -0.13409423828125, -0.118072509765625, -0.10205078125, -0.086029052734375, -0.07000732421875, -0.053985595703125, -0.0379638671875, -0.021942138671875, -0.00592041015625, 0.010101318359375, 0.026123046875, 0.042144775390625, 0.05816650390625, 0.074188232421875, 0.0902099609375, 0.106231689453125, 0.12225341796875, 0.138275146484375, 0.154296875, 0.170318603515625, 0.18634033203125, 0.202362060546875, 0.2183837890625, 0.234405517578125, 0.25042724609375, 0.266448974609375, 0.282470703125, 0.298492431640625, 0.31451416015625, 0.330535888671875, 0.3465576171875, 0.362579345703125, 0.37860107421875, 0.394622802734375, 0.41064453125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 4.0, 6.0, 5.0, 8.0, 3.0, 6.0, 12.0, 29.0, 26.0, 31.0, 46.0, 40.0, 48.0, 61.0, 54.0, 65.0, 59.0, 73.0, 64.0, 56.0, 43.0, 46.0, 42.0, 43.0, 27.0, 23.0, 18.0, 14.0, 4.0, 9.0, 8.0, 3.0, 7.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.294921875, -0.28591156005859375, -0.2769012451171875, -0.26789093017578125, -0.258880615234375, -0.24987030029296875, -0.2408599853515625, -0.23184967041015625, -0.22283935546875, -0.21382904052734375, -0.2048187255859375, -0.19580841064453125, -0.186798095703125, -0.17778778076171875, -0.1687774658203125, -0.15976715087890625, -0.1507568359375, -0.14174652099609375, -0.1327362060546875, -0.12372589111328125, -0.114715576171875, -0.10570526123046875, -0.0966949462890625, -0.08768463134765625, -0.07867431640625, -0.06966400146484375, -0.0606536865234375, -0.05164337158203125, -0.042633056640625, -0.03362274169921875, -0.0246124267578125, -0.01560211181640625, -0.006591796875, 0.00241851806640625, 0.0114288330078125, 0.02043914794921875, 0.029449462890625, 0.03845977783203125, 0.0474700927734375, 0.05648040771484375, 0.06549072265625, 0.07450103759765625, 0.0835113525390625, 0.09252166748046875, 0.101531982421875, 0.11054229736328125, 0.1195526123046875, 0.12856292724609375, 0.1375732421875, 0.14658355712890625, 0.1555938720703125, 0.16460418701171875, 0.173614501953125, 0.18262481689453125, 0.1916351318359375, 0.20064544677734375, 0.20965576171875, 0.21866607666015625, 0.2276763916015625, 0.23668670654296875, 0.245697021484375, 0.25470733642578125, 0.2637176513671875, 0.27272796630859375, 0.28173828125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 11.0, 8.0, 20.0, 53.0, 98.0, 232.0, 290.0, 142.0, 73.0, 21.0, 13.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.161901473999023, -4.965007305145264, -4.768112659454346, -4.571218490600586, -4.374323844909668, -4.177429676055908, -3.9805352687835693, -3.7836408615112305, -3.5867464542388916, -3.3898520469665527, -3.192957639694214, -2.996063232421875, -2.7991690635681152, -2.6022744178771973, -2.4053802490234375, -2.2084858417510986, -2.0115914344787598, -1.814697027206421, -1.617802619934082, -1.4209083318710327, -1.2240139245986938, -1.027119517326355, -0.8302252292633057, -0.6333308219909668, -0.43643641471862793, -0.23954203724861145, -0.04264765977859497, 0.15424668788909912, 0.351141095161438, 0.5480355024337769, 0.7449297904968262, 0.941824197769165, 1.138718605041504, 1.3356130123138428, 1.5325074195861816, 1.729401707649231, 1.9262961149215698, 2.123190402984619, 2.320084810256958, 2.516979217529297, 2.7138736248016357, 2.9107680320739746, 3.1076624393463135, 3.3045568466186523, 3.501451015472412, 3.69834566116333, 3.89523983001709, 4.092134475708008, 4.289028644561768, 4.485922813415527, 4.682817459106445, 4.879711627960205, 5.076606273651123, 5.273500442504883, 5.470395088195801, 5.6672892570495605, 5.86418342590332, 6.06107759475708, 6.257972240447998, 6.454866409301758, 6.651761054992676, 6.8486552238464355, 7.045549392700195, 7.242444038391113, 7.439338684082031]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 6.0, 2.0, 7.0, 4.0, 6.0, 10.0, 10.0, 14.0, 14.0, 32.0, 44.0, 66.0, 109.0, 127.0, 131.0, 134.0, 90.0, 53.0, 45.0, 21.0, 10.0, 11.0, 11.0, 9.0, 7.0, 3.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.683117866516113, -5.527040958404541, -5.370964050292969, -5.214886665344238, -5.058809757232666, -4.902732849121094, -4.7466559410095215, -4.590579032897949, -4.434501647949219, -4.2784247398376465, -4.122347831726074, -3.966270685195923, -3.8101935386657715, -3.654116630554199, -3.498039722442627, -3.3419625759124756, -3.1858856678009033, -3.029808759689331, -2.8737316131591797, -2.7176547050476074, -2.561577558517456, -2.405500650405884, -2.2494235038757324, -2.09334659576416, -1.9372695684432983, -1.7811925411224365, -1.6251155138015747, -1.469038486480713, -1.3129615783691406, -1.1568844318389893, -1.000807523727417, -0.8447304964065552, -0.6886534690856934, -0.5325764417648315, -0.3764994442462921, -0.22042244672775269, -0.06434541940689087, 0.09173160791397095, 0.247808575630188, 0.4038856029510498, 0.5599626302719116, 0.7160396575927734, 0.8721166849136353, 1.028193712234497, 1.1842706203460693, 1.3403477668762207, 1.496424674987793, 1.6525017023086548, 1.8085787296295166, 1.9646557569503784, 2.1207327842712402, 2.2768096923828125, 2.432886838912964, 2.588963747024536, 2.7450408935546875, 2.9011178016662598, 3.057194709777832, 3.2132716178894043, 3.3693487644195557, 3.525425672531128, 3.6815028190612793, 3.8375797271728516, 3.993656635284424, 4.149733543395996, 4.305810928344727]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 10.0, 6.0, 21.0, 37.0, 76.0, 259.0, 1620.0, 20500.0, 4132452.0, 36671.0, 2088.0, 336.0, 125.0, 33.0, 20.0, 8.0, 12.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.02734375, -4.914581298828125, -4.80181884765625, -4.689056396484375, -4.5762939453125, -4.463531494140625, -4.35076904296875, -4.238006591796875, -4.125244140625, -4.012481689453125, -3.89971923828125, -3.786956787109375, -3.6741943359375, -3.561431884765625, -3.44866943359375, -3.335906982421875, -3.22314453125, -3.110382080078125, -2.99761962890625, -2.884857177734375, -2.7720947265625, -2.659332275390625, -2.54656982421875, -2.433807373046875, -2.321044921875, -2.208282470703125, -2.09552001953125, -1.982757568359375, -1.8699951171875, -1.757232666015625, -1.64447021484375, -1.531707763671875, -1.4189453125, -1.306182861328125, -1.19342041015625, -1.080657958984375, -0.9678955078125, -0.855133056640625, -0.74237060546875, -0.629608154296875, -0.516845703125, -0.404083251953125, -0.29132080078125, -0.178558349609375, -0.0657958984375, 0.046966552734375, 0.15972900390625, 0.272491455078125, 0.38525390625, 0.498016357421875, 0.61077880859375, 0.723541259765625, 0.8363037109375, 0.949066162109375, 1.06182861328125, 1.174591064453125, 1.287353515625, 1.400115966796875, 1.51287841796875, 1.625640869140625, 1.7384033203125, 1.851165771484375, 1.96392822265625, 2.076690673828125, 2.189453125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 5.0, 5.0, 3.0, 4.0, 4.0, 11.0, 10.0, 14.0, 25.0, 34.0, 80.0, 151.0, 208.0, 190.0, 94.0, 56.0, 27.0, 15.0, 7.0, 7.0, 7.0, 3.0, 15.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0684814453125, -0.06632328033447266, -0.06416511535644531, -0.06200695037841797, -0.059848785400390625, -0.05769062042236328, -0.05553245544433594, -0.053374290466308594, -0.05121612548828125, -0.049057960510253906, -0.04689979553222656, -0.04474163055419922, -0.042583465576171875, -0.04042530059814453, -0.03826713562011719, -0.036108970642089844, -0.0339508056640625, -0.031792640686035156, -0.029634475708007812, -0.02747631072998047, -0.025318145751953125, -0.02315998077392578, -0.021001815795898438, -0.018843650817871094, -0.01668548583984375, -0.014527320861816406, -0.012369155883789062, -0.010210990905761719, -0.008052825927734375, -0.005894660949707031, -0.0037364959716796875, -0.0015783309936523438, 0.000579833984375, 0.0027379989624023438, 0.0048961639404296875, 0.007054328918457031, 0.009212493896484375, 0.011370658874511719, 0.013528823852539062, 0.015686988830566406, 0.01784515380859375, 0.020003318786621094, 0.022161483764648438, 0.02431964874267578, 0.026477813720703125, 0.02863597869873047, 0.030794143676757812, 0.032952308654785156, 0.0351104736328125, 0.037268638610839844, 0.03942680358886719, 0.04158496856689453, 0.043743133544921875, 0.04590129852294922, 0.04805946350097656, 0.050217628479003906, 0.05237579345703125, 0.054533958435058594, 0.05669212341308594, 0.05885028839111328, 0.061008453369140625, 0.06316661834716797, 0.06532478332519531, 0.06748294830322266, 0.06964111328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 9.0, 11.0, 24.0, 25.0, 33.0, 43.0, 80.0, 100.0, 171.0, 220.0, 397.0, 629.0, 1047.0, 1845.0, 3331.0, 6646.0, 14719.0, 38548.0, 149458.0, 2134174.0, 1639921.0, 137068.0, 36876.0, 14183.0, 6498.0, 3301.0, 1918.0, 1098.0, 665.0, 425.0, 276.0, 175.0, 132.0, 71.0, 51.0, 30.0, 24.0, 19.0, 15.0, 9.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5419921875, -0.522613525390625, -0.50323486328125, -0.483856201171875, -0.4644775390625, -0.445098876953125, -0.42572021484375, -0.406341552734375, -0.386962890625, -0.367584228515625, -0.34820556640625, -0.328826904296875, -0.3094482421875, -0.290069580078125, -0.27069091796875, -0.251312255859375, -0.23193359375, -0.212554931640625, -0.19317626953125, -0.173797607421875, -0.1544189453125, -0.135040283203125, -0.11566162109375, -0.096282958984375, -0.076904296875, -0.057525634765625, -0.03814697265625, -0.018768310546875, 0.0006103515625, 0.019989013671875, 0.03936767578125, 0.058746337890625, 0.078125, 0.097503662109375, 0.11688232421875, 0.136260986328125, 0.1556396484375, 0.175018310546875, 0.19439697265625, 0.213775634765625, 0.233154296875, 0.252532958984375, 0.27191162109375, 0.291290283203125, 0.3106689453125, 0.330047607421875, 0.34942626953125, 0.368804931640625, 0.38818359375, 0.407562255859375, 0.42694091796875, 0.446319580078125, 0.4656982421875, 0.485076904296875, 0.50445556640625, 0.523834228515625, 0.543212890625, 0.562591552734375, 0.58197021484375, 0.601348876953125, 0.6207275390625, 0.640106201171875, 0.65948486328125, 0.678863525390625, 0.6982421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 9.0, 10.0, 19.0, 7.0, 19.0, 22.0, 41.0, 92.0, 168.0, 374.0, 1186.0, 1256.0, 408.0, 170.0, 94.0, 67.0, 36.0, 30.0, 20.0, 9.0, 9.0, 7.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148193359375, -0.14369773864746094, -0.13920211791992188, -0.1347064971923828, -0.13021087646484375, -0.1257152557373047, -0.12121963500976562, -0.11672401428222656, -0.1122283935546875, -0.10773277282714844, -0.10323715209960938, -0.09874153137207031, -0.09424591064453125, -0.08975028991699219, -0.08525466918945312, -0.08075904846191406, -0.076263427734375, -0.07176780700683594, -0.06727218627929688, -0.06277656555175781, -0.05828094482421875, -0.05378532409667969, -0.049289703369140625, -0.04479408264160156, -0.0402984619140625, -0.03580284118652344, -0.031307220458984375, -0.026811599731445312, -0.02231597900390625, -0.017820358276367188, -0.013324737548828125, -0.008829116821289062, -0.00433349609375, 0.0001621246337890625, 0.004657745361328125, 0.009153366088867188, 0.01364898681640625, 0.018144607543945312, 0.022640228271484375, 0.027135848999023438, 0.0316314697265625, 0.03612709045410156, 0.040622711181640625, 0.04511833190917969, 0.04961395263671875, 0.05410957336425781, 0.058605194091796875, 0.06310081481933594, 0.067596435546875, 0.07209205627441406, 0.07658767700195312, 0.08108329772949219, 0.08557891845703125, 0.09007453918457031, 0.09457015991210938, 0.09906578063964844, 0.1035614013671875, 0.10805702209472656, 0.11255264282226562, 0.11704826354980469, 0.12154388427734375, 0.1260395050048828, 0.13053512573242188, 0.13503074645996094, 0.1395263671875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 30.0, 193.0, 517.0, 209.0, 44.0, 9.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.846590280532837, -1.7603347301483154, -1.674079179763794, -1.5878236293792725, -1.501568078994751, -1.4153125286102295, -1.3290568590164185, -1.242801308631897, -1.1565457582473755, -1.070290207862854, -0.9840346574783325, -0.8977790474891663, -0.8115234971046448, -0.7252679467201233, -0.639012336730957, -0.5527567863464355, -0.46650123596191406, -0.3802456855773926, -0.2939901053905487, -0.20773452520370483, -0.12147897481918335, -0.035223424434661865, 0.051032185554504395, 0.13728773593902588, 0.22354328632354736, 0.30979883670806885, 0.3960544168949127, 0.4823099970817566, 0.5685655474662781, 0.6548210978507996, 0.7410767078399658, 0.8273322582244873, 0.9135878086090088, 0.9998433589935303, 1.0860989093780518, 1.1723544597625732, 1.2586100101470947, 1.3448655605316162, 1.4311212301254272, 1.5173767805099487, 1.6036323308944702, 1.6898878812789917, 1.7761434316635132, 1.8623991012573242, 1.9486546516418457, 2.034910202026367, 2.1211657524108887, 2.20742130279541, 2.2936768531799316, 2.379932403564453, 2.4661879539489746, 2.552443504333496, 2.6386990547180176, 2.724954605102539, 2.8112101554870605, 2.897465705871582, 2.9837212562561035, 3.069976806640625, 3.1562323570251465, 3.242487907409668, 3.3287434577941895, 3.414999008178711, 3.5012545585632324, 3.587510108947754, 3.6737658977508545]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 5.0, 5.0, 2.0, 4.0, 9.0, 6.0, 7.0, 18.0, 25.0, 35.0, 53.0, 56.0, 91.0, 92.0, 105.0, 115.0, 87.0, 70.0, 59.0, 49.0, 29.0, 19.0, 12.0, 13.0, 7.0, 8.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7490231394767761, -0.7257136702537537, -0.7024042010307312, -0.6790947318077087, -0.6557852029800415, -0.632475733757019, -0.6091662645339966, -0.5858567953109741, -0.5625473260879517, -0.5392378568649292, -0.5159283876419067, -0.4926188886165619, -0.46930941939353943, -0.44599995017051697, -0.4226904511451721, -0.39938098192214966, -0.3760715126991272, -0.35276204347610474, -0.3294525742530823, -0.3061430752277374, -0.28283360600471497, -0.2595241367816925, -0.23621465265750885, -0.2129051685333252, -0.18959569931030273, -0.16628623008728027, -0.14297674596309662, -0.11966726928949356, -0.0963577926158905, -0.07304831594228745, -0.04973883926868439, -0.026429355144500732, -0.003119826316833496, 0.020189650356769562, 0.04349912703037262, 0.06680860370397568, 0.09011808037757874, 0.1134275570511818, 0.13673703372478485, 0.1600465178489685, 0.18335598707199097, 0.20666545629501343, 0.22997494041919708, 0.25328442454338074, 0.2765938937664032, 0.29990336298942566, 0.3232128620147705, 0.34652233123779297, 0.36983180046081543, 0.3931412696838379, 0.41645073890686035, 0.4397602379322052, 0.46306970715522766, 0.4863791763782501, 0.509688675403595, 0.5329981446266174, 0.5563076138496399, 0.5796170830726624, 0.6029265522956848, 0.6262360215187073, 0.6495455503463745, 0.672855019569397, 0.6961644887924194, 0.7194739580154419, 0.7427834272384644]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 3.0, 1.0, 5.0, 10.0, 13.0, 10.0, 19.0, 20.0, 34.0, 70.0, 128.0, 232.0, 434.0, 893.0, 2066.0, 5991.0, 19687.0, 107792.0, 751037.0, 127605.0, 21783.0, 6471.0, 2279.0, 968.0, 414.0, 239.0, 130.0, 72.0, 43.0, 24.0, 14.0, 7.0, 7.0, 6.0, 8.0, 4.0, 10.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.78369140625, -0.7603225708007812, -0.7369537353515625, -0.7135848999023438, -0.690216064453125, -0.6668472290039062, -0.6434783935546875, -0.6201095581054688, -0.59674072265625, -0.5733718872070312, -0.5500030517578125, -0.5266342163085938, -0.503265380859375, -0.47989654541015625, -0.4565277099609375, -0.43315887451171875, -0.4097900390625, -0.38642120361328125, -0.3630523681640625, -0.33968353271484375, -0.316314697265625, -0.29294586181640625, -0.2695770263671875, -0.24620819091796875, -0.22283935546875, -0.19947052001953125, -0.1761016845703125, -0.15273284912109375, -0.129364013671875, -0.10599517822265625, -0.0826263427734375, -0.05925750732421875, -0.035888671875, -0.01251983642578125, 0.0108489990234375, 0.03421783447265625, 0.057586669921875, 0.08095550537109375, 0.1043243408203125, 0.12769317626953125, 0.15106201171875, 0.17443084716796875, 0.1977996826171875, 0.22116851806640625, 0.244537353515625, 0.26790618896484375, 0.2912750244140625, 0.31464385986328125, 0.3380126953125, 0.36138153076171875, 0.3847503662109375, 0.40811920166015625, 0.431488037109375, 0.45485687255859375, 0.4782257080078125, 0.5015945434570312, 0.52496337890625, 0.5483322143554688, 0.5717010498046875, 0.5950698852539062, 0.618438720703125, 0.6418075561523438, 0.6651763916015625, 0.6885452270507812, 0.7119140625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 11.0, 9.0, 16.0, 30.0, 71.0, 106.0, 184.0, 198.0, 150.0, 98.0, 48.0, 23.0, 13.0, 4.0, 8.0, 9.0, 7.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04547119140625, -0.04298686981201172, -0.04050254821777344, -0.038018226623535156, -0.035533905029296875, -0.033049583435058594, -0.030565261840820312, -0.02808094024658203, -0.02559661865234375, -0.02311229705810547, -0.020627975463867188, -0.018143653869628906, -0.015659332275390625, -0.013175010681152344, -0.010690689086914062, -0.008206367492675781, -0.0057220458984375, -0.0032377243041992188, -0.0007534027099609375, 0.0017309188842773438, 0.004215240478515625, 0.006699562072753906, 0.009183883666992188, 0.011668205261230469, 0.01415252685546875, 0.01663684844970703, 0.019121170043945312, 0.021605491638183594, 0.024089813232421875, 0.026574134826660156, 0.029058456420898438, 0.03154277801513672, 0.034027099609375, 0.03651142120361328, 0.03899574279785156, 0.041480064392089844, 0.043964385986328125, 0.046448707580566406, 0.04893302917480469, 0.05141735076904297, 0.05390167236328125, 0.05638599395751953, 0.05887031555175781, 0.061354637145996094, 0.06383895874023438, 0.06632328033447266, 0.06880760192871094, 0.07129192352294922, 0.0737762451171875, 0.07626056671142578, 0.07874488830566406, 0.08122920989990234, 0.08371353149414062, 0.0861978530883789, 0.08868217468261719, 0.09116649627685547, 0.09365081787109375, 0.09613513946533203, 0.09861946105957031, 0.1011037826538086, 0.10358810424804688, 0.10607242584228516, 0.10855674743652344, 0.11104106903076172, 0.113525390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 3.0, 5.0, 5.0, 5.0, 8.0, 9.0, 43.0, 187.0, 2296.0, 356094.0, 685696.0, 3814.0, 255.0, 40.0, 11.0, 2.0, 3.0, 9.0, 4.0, 1.0, 13.0, 4.0, 3.0, 2.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.4140625, -2.3506622314453125, -2.287261962890625, -2.2238616943359375, -2.16046142578125, -2.0970611572265625, -2.033660888671875, -1.9702606201171875, -1.9068603515625, -1.8434600830078125, -1.780059814453125, -1.7166595458984375, -1.65325927734375, -1.5898590087890625, -1.526458740234375, -1.4630584716796875, -1.399658203125, -1.3362579345703125, -1.272857666015625, -1.2094573974609375, -1.14605712890625, -1.0826568603515625, -1.019256591796875, -0.9558563232421875, -0.8924560546875, -0.8290557861328125, -0.765655517578125, -0.7022552490234375, -0.63885498046875, -0.5754547119140625, -0.512054443359375, -0.4486541748046875, -0.38525390625, -0.3218536376953125, -0.258453369140625, -0.1950531005859375, -0.13165283203125, -0.0682525634765625, -0.004852294921875, 0.0585479736328125, 0.1219482421875, 0.1853485107421875, 0.248748779296875, 0.3121490478515625, 0.37554931640625, 0.4389495849609375, 0.502349853515625, 0.5657501220703125, 0.629150390625, 0.6925506591796875, 0.755950927734375, 0.8193511962890625, 0.88275146484375, 0.9461517333984375, 1.009552001953125, 1.0729522705078125, 1.1363525390625, 1.1997528076171875, 1.263153076171875, 1.3265533447265625, 1.38995361328125, 1.4533538818359375, 1.516754150390625, 1.5801544189453125, 1.6435546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 1.0, 3.0, 7.0, 15.0, 11.0, 13.0, 13.0, 16.0, 22.0, 15.0, 30.0, 32.0, 46.0, 42.0, 34.0, 47.0, 33.0, 38.0, 44.0, 38.0, 31.0, 44.0, 50.0, 36.0, 33.0, 42.0, 36.0, 36.0, 25.0, 23.0, 19.0, 10.0, 18.0, 15.0, 18.0, 10.0, 9.0, 8.0, 5.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15380859375, -0.14833450317382812, -0.14286041259765625, -0.13738632202148438, -0.1319122314453125, -0.12643814086914062, -0.12096405029296875, -0.11548995971679688, -0.110015869140625, -0.10454177856445312, -0.09906768798828125, -0.09359359741210938, -0.0881195068359375, -0.08264541625976562, -0.07717132568359375, -0.07169723510742188, -0.06622314453125, -0.060749053955078125, -0.05527496337890625, -0.049800872802734375, -0.0443267822265625, -0.038852691650390625, -0.03337860107421875, -0.027904510498046875, -0.022430419921875, -0.016956329345703125, -0.01148223876953125, -0.006008148193359375, -0.0005340576171875, 0.004940032958984375, 0.01041412353515625, 0.015888214111328125, 0.0213623046875, 0.026836395263671875, 0.03231048583984375, 0.037784576416015625, 0.0432586669921875, 0.048732757568359375, 0.05420684814453125, 0.059680938720703125, 0.065155029296875, 0.07062911987304688, 0.07610321044921875, 0.08157730102539062, 0.0870513916015625, 0.09252548217773438, 0.09799957275390625, 0.10347366333007812, 0.10894775390625, 0.11442184448242188, 0.11989593505859375, 0.12537002563476562, 0.1308441162109375, 0.13631820678710938, 0.14179229736328125, 0.14726638793945312, 0.152740478515625, 0.15821456909179688, 0.16368865966796875, 0.16916275024414062, 0.1746368408203125, 0.18011093139648438, 0.18558502197265625, 0.19105911254882812, 0.196533203125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 1.0, 15.0, 19.0, 84.0, 1540.0, 1046195.0, 611.0, 53.0, 18.0, 2.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.546875, -18.0635986328125, -17.580322265625, -17.0970458984375, -16.61376953125, -16.1304931640625, -15.647216796875, -15.1639404296875, -14.6806640625, -14.1973876953125, -13.714111328125, -13.2308349609375, -12.74755859375, -12.2642822265625, -11.781005859375, -11.2977294921875, -10.814453125, -10.3311767578125, -9.847900390625, -9.3646240234375, -8.88134765625, -8.3980712890625, -7.914794921875, -7.4315185546875, -6.9482421875, -6.4649658203125, -5.981689453125, -5.4984130859375, -5.01513671875, -4.5318603515625, -4.048583984375, -3.5653076171875, -3.08203125, -2.5987548828125, -2.115478515625, -1.6322021484375, -1.14892578125, -0.6656494140625, -0.182373046875, 0.3009033203125, 0.7841796875, 1.2674560546875, 1.750732421875, 2.2340087890625, 2.71728515625, 3.2005615234375, 3.683837890625, 4.1671142578125, 4.650390625, 5.1336669921875, 5.616943359375, 6.1002197265625, 6.58349609375, 7.0667724609375, 7.550048828125, 8.0333251953125, 8.5166015625, 8.9998779296875, 9.483154296875, 9.9664306640625, 10.44970703125, 10.9329833984375, 11.416259765625, 11.8995361328125, 12.3828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 13.0, 10.0, 27.0, 28.0, 61.0, 77.0, 102.0, 118.0, 145.0, 123.0, 85.0, 61.0, 37.0, 28.0, 13.0, 9.0, 9.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.832050323486328e-05, -7.58785754442215e-05, -7.343664765357971e-05, -7.099471986293793e-05, -6.855279207229614e-05, -6.611086428165436e-05, -6.366893649101257e-05, -6.122700870037079e-05, -5.8785080909729004e-05, -5.634315311908722e-05, -5.3901225328445435e-05, -5.145929753780365e-05, -4.9017369747161865e-05, -4.657544195652008e-05, -4.4133514165878296e-05, -4.169158637523651e-05, -3.9249658584594727e-05, -3.680773079395294e-05, -3.436580300331116e-05, -3.192387521266937e-05, -2.9481947422027588e-05, -2.7040019631385803e-05, -2.459809184074402e-05, -2.2156164050102234e-05, -1.971423625946045e-05, -1.7272308468818665e-05, -1.483038067817688e-05, -1.2388452887535095e-05, -9.94652509689331e-06, -7.504597306251526e-06, -5.062669515609741e-06, -2.6207417249679565e-06, -1.7881393432617188e-07, 2.263113856315613e-06, 4.7050416469573975e-06, 7.146969437599182e-06, 9.588897228240967e-06, 1.2030825018882751e-05, 1.4472752809524536e-05, 1.691468060016632e-05, 1.9356608390808105e-05, 2.179853618144989e-05, 2.4240463972091675e-05, 2.668239176273346e-05, 2.9124319553375244e-05, 3.156624734401703e-05, 3.4008175134658813e-05, 3.64501029253006e-05, 3.889203071594238e-05, 4.133395850658417e-05, 4.377588629722595e-05, 4.621781408786774e-05, 4.865974187850952e-05, 5.1101669669151306e-05, 5.354359745979309e-05, 5.5985525250434875e-05, 5.842745304107666e-05, 6.0869380831718445e-05, 6.331130862236023e-05, 6.575323641300201e-05, 6.81951642036438e-05, 7.063709199428558e-05, 7.307901978492737e-05, 7.552094757556915e-05, 7.796287536621094e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 13.0, 6.0, 20.0, 11.0, 26.0, 36.0, 50.0, 124.0, 265.0, 718.0, 1908.0, 6035.0, 45918.0, 913218.0, 69709.0, 6758.0, 2118.0, 808.0, 361.0, 153.0, 87.0, 50.0, 46.0, 31.0, 20.0, 17.0, 15.0, 14.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87353515625, -0.8288803100585938, -0.7842254638671875, -0.7395706176757812, -0.694915771484375, -0.6502609252929688, -0.6056060791015625, -0.5609512329101562, -0.51629638671875, -0.47164154052734375, -0.4269866943359375, -0.38233184814453125, -0.337677001953125, -0.29302215576171875, -0.2483673095703125, -0.20371246337890625, -0.1590576171875, -0.11440277099609375, -0.0697479248046875, -0.02509307861328125, 0.019561767578125, 0.06421661376953125, 0.1088714599609375, 0.15352630615234375, 0.19818115234375, 0.24283599853515625, 0.2874908447265625, 0.33214569091796875, 0.376800537109375, 0.42145538330078125, 0.4661102294921875, 0.5107650756835938, 0.555419921875, 0.6000747680664062, 0.6447296142578125, 0.6893844604492188, 0.734039306640625, 0.7786941528320312, 0.8233489990234375, 0.8680038452148438, 0.91265869140625, 0.9573135375976562, 1.0019683837890625, 1.0466232299804688, 1.091278076171875, 1.1359329223632812, 1.1805877685546875, 1.2252426147460938, 1.2698974609375, 1.3145523071289062, 1.3592071533203125, 1.4038619995117188, 1.448516845703125, 1.4931716918945312, 1.5378265380859375, 1.5824813842773438, 1.62713623046875, 1.6717910766601562, 1.7164459228515625, 1.7611007690429688, 1.805755615234375, 1.8504104614257812, 1.8950653076171875, 1.9397201538085938, 1.984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 1.0, 5.0, 7.0, 25.0, 64.0, 157.0, 285.0, 267.0, 114.0, 47.0, 6.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54541015625, -0.5109176635742188, -0.4764251708984375, -0.44193267822265625, -0.407440185546875, -0.37294769287109375, -0.3384552001953125, -0.30396270751953125, -0.26947021484375, -0.23497772216796875, -0.2004852294921875, -0.16599273681640625, -0.131500244140625, -0.09700775146484375, -0.0625152587890625, -0.02802276611328125, 0.0064697265625, 0.04096221923828125, 0.0754547119140625, 0.10994720458984375, 0.144439697265625, 0.17893218994140625, 0.2134246826171875, 0.24791717529296875, 0.28240966796875, 0.31690216064453125, 0.3513946533203125, 0.38588714599609375, 0.420379638671875, 0.45487213134765625, 0.4893646240234375, 0.5238571166992188, 0.558349609375, 0.5928421020507812, 0.6273345947265625, 0.6618270874023438, 0.696319580078125, 0.7308120727539062, 0.7653045654296875, 0.7997970581054688, 0.83428955078125, 0.8687820434570312, 0.9032745361328125, 0.9377670288085938, 0.972259521484375, 1.0067520141601562, 1.0412445068359375, 1.0757369995117188, 1.1102294921875, 1.1447219848632812, 1.1792144775390625, 1.2137069702148438, 1.248199462890625, 1.2826919555664062, 1.3171844482421875, 1.3516769409179688, 1.38616943359375, 1.4206619262695312, 1.4551544189453125, 1.4896469116210938, 1.524139404296875, 1.5586318969726562, 1.5931243896484375, 1.6276168823242188, 1.662109375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 14.0, 31.0, 188.0, 387.0, 236.0, 77.0, 32.0, 21.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.526920318603516, -8.286758422851562, -8.046595573425293, -7.80643367767334, -7.566271781921387, -7.326109409332275, -7.085947513580322, -6.845785140991211, -6.605623245239258, -6.3654608726501465, -6.125298976898193, -5.885136604309082, -5.644974708557129, -5.404812335968018, -5.1646504402160645, -4.924488067626953, -4.684326171875, -4.444163799285889, -4.2040019035339355, -3.9638397693634033, -3.723677635192871, -3.4835152626037598, -3.2433533668518066, -3.0031909942626953, -2.763028621673584, -2.5228664875030518, -2.2827043533325195, -2.0425422191619873, -1.802380084991455, -1.5622178316116333, -1.322055697441101, -1.0818935632705688, -0.8417315483093262, -0.601569414138794, -0.36140725016593933, -0.12124508619308472, 0.11891704797744751, 0.3590792417526245, 0.5992413759231567, 0.839403510093689, 1.0795656442642212, 1.3197277784347534, 1.5598899126052856, 1.8000521659851074, 2.0402143001556396, 2.280376434326172, 2.520538568496704, 2.7607007026672363, 3.0008628368377686, 3.241024971008301, 3.481187105178833, 3.7213492393493652, 3.9615113735198975, 4.20167350769043, 4.441835880279541, 4.681997776031494, 4.9221601486206055, 5.162322521209717, 5.40248441696167, 5.642646789550781, 5.882808685302734, 6.122971057891846, 6.363132953643799, 6.60329532623291, 6.843457221984863]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 7.0, 9.0, 8.0, 11.0, 20.0, 18.0, 31.0, 34.0, 55.0, 70.0, 65.0, 83.0, 76.0, 67.0, 88.0, 73.0, 63.0, 42.0, 33.0, 42.0, 23.0, 19.0, 18.0, 11.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.629892110824585, -2.548163890838623, -2.4664359092712402, -2.3847079277038574, -2.3029797077178955, -2.2212514877319336, -2.139523506164551, -2.057795524597168, -1.976067304611206, -1.8943392038345337, -1.8126111030578613, -1.730883002281189, -1.6491549015045166, -1.5674268007278442, -1.4856986999511719, -1.4039705991744995, -1.3222424983978271, -1.2405143976211548, -1.1587862968444824, -1.07705819606781, -0.9953300952911377, -0.9136019945144653, -0.831873893737793, -0.7501457929611206, -0.6684176921844482, -0.5866895914077759, -0.5049614906311035, -0.42323338985443115, -0.3415052890777588, -0.2597771883010864, -0.17804908752441406, -0.0963209867477417, -0.014593124389648438, 0.06713497638702393, 0.1488630771636963, 0.23059117794036865, 0.312319278717041, 0.3940473794937134, 0.47577548027038574, 0.5575035810470581, 0.6392316818237305, 0.7209597826004028, 0.8026878833770752, 0.8844159841537476, 0.9661440849304199, 1.0478721857070923, 1.1296002864837646, 1.211328387260437, 1.2930564880371094, 1.3747845888137817, 1.456512689590454, 1.5382407903671265, 1.6199688911437988, 1.7016969919204712, 1.7834250926971436, 1.865153193473816, 1.9468812942504883, 2.028609275817871, 2.110337495803833, 2.192065715789795, 2.2737936973571777, 2.3555216789245605, 2.4372498989105225, 2.5189781188964844, 2.600706100463867]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 4.0, 4.0, 7.0, 10.0, 12.0, 19.0, 13.0, 28.0, 46.0, 44.0, 83.0, 134.0, 188.0, 317.0, 522.0, 938.0, 1934.0, 4007.0, 9714.0, 32197.0, 294030.0, 3717476.0, 99711.0, 19624.0, 6815.0, 2859.0, 1463.0, 788.0, 474.0, 290.0, 182.0, 130.0, 74.0, 42.0, 37.0, 28.0, 9.0, 10.0, 9.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1875, -1.15386962890625, -1.1202392578125, -1.08660888671875, -1.052978515625, -1.01934814453125, -0.9857177734375, -0.95208740234375, -0.91845703125, -0.88482666015625, -0.8511962890625, -0.81756591796875, -0.783935546875, -0.75030517578125, -0.7166748046875, -0.68304443359375, -0.6494140625, -0.61578369140625, -0.5821533203125, -0.54852294921875, -0.514892578125, -0.48126220703125, -0.4476318359375, -0.41400146484375, -0.38037109375, -0.34674072265625, -0.3131103515625, -0.27947998046875, -0.245849609375, -0.21221923828125, -0.1785888671875, -0.14495849609375, -0.111328125, -0.07769775390625, -0.0440673828125, -0.01043701171875, 0.023193359375, 0.05682373046875, 0.0904541015625, 0.12408447265625, 0.15771484375, 0.19134521484375, 0.2249755859375, 0.25860595703125, 0.292236328125, 0.32586669921875, 0.3594970703125, 0.39312744140625, 0.4267578125, 0.46038818359375, 0.4940185546875, 0.52764892578125, 0.561279296875, 0.59490966796875, 0.6285400390625, 0.66217041015625, 0.69580078125, 0.72943115234375, 0.7630615234375, 0.79669189453125, 0.830322265625, 0.86395263671875, 0.8975830078125, 0.93121337890625, 0.96484375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 10.0, 7.0, 10.0, 16.0, 26.0, 36.0, 49.0, 46.0, 56.0, 74.0, 93.0, 99.0, 83.0, 79.0, 76.0, 61.0, 49.0, 35.0, 26.0, 12.0, 10.0, 9.0, 9.0, 7.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.055877685546875, -0.054355621337890625, -0.05283355712890625, -0.051311492919921875, -0.0497894287109375, -0.048267364501953125, -0.04674530029296875, -0.045223236083984375, -0.043701171875, -0.042179107666015625, -0.04065704345703125, -0.039134979248046875, -0.0376129150390625, -0.036090850830078125, -0.03456878662109375, -0.033046722412109375, -0.031524658203125, -0.030002593994140625, -0.02848052978515625, -0.026958465576171875, -0.0254364013671875, -0.023914337158203125, -0.02239227294921875, -0.020870208740234375, -0.01934814453125, -0.017826080322265625, -0.01630401611328125, -0.014781951904296875, -0.0132598876953125, -0.011737823486328125, -0.01021575927734375, -0.008693695068359375, -0.007171630859375, -0.005649566650390625, -0.00412750244140625, -0.002605438232421875, -0.0010833740234375, 0.000438690185546875, 0.00196075439453125, 0.003482818603515625, 0.0050048828125, 0.006526947021484375, 0.00804901123046875, 0.009571075439453125, 0.0110931396484375, 0.012615203857421875, 0.01413726806640625, 0.015659332275390625, 0.017181396484375, 0.018703460693359375, 0.02022552490234375, 0.021747589111328125, 0.0232696533203125, 0.024791717529296875, 0.02631378173828125, 0.027835845947265625, 0.02935791015625, 0.030879974365234375, 0.03240203857421875, 0.033924102783203125, 0.0354461669921875, 0.036968231201171875, 0.03849029541015625, 0.040012359619140625, 0.041534423828125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 1.0, 2.0, 9.0, 2.0, 9.0, 7.0, 13.0, 8.0, 15.0, 10.0, 16.0, 14.0, 24.0, 34.0, 48.0, 82.0, 186.0, 554.0, 3230.0, 33016.0, 3285016.0, 849088.0, 19710.0, 2172.0, 479.0, 162.0, 105.0, 59.0, 44.0, 37.0, 25.0, 13.0, 14.0, 10.0, 5.0, 12.0, 10.0, 4.0, 6.0, 6.0, 9.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.01953125, -1.961669921875, -1.90380859375, -1.845947265625, -1.7880859375, -1.730224609375, -1.67236328125, -1.614501953125, -1.556640625, -1.498779296875, -1.44091796875, -1.383056640625, -1.3251953125, -1.267333984375, -1.20947265625, -1.151611328125, -1.09375, -1.035888671875, -0.97802734375, -0.920166015625, -0.8623046875, -0.804443359375, -0.74658203125, -0.688720703125, -0.630859375, -0.572998046875, -0.51513671875, -0.457275390625, -0.3994140625, -0.341552734375, -0.28369140625, -0.225830078125, -0.16796875, -0.110107421875, -0.05224609375, 0.005615234375, 0.0634765625, 0.121337890625, 0.17919921875, 0.237060546875, 0.294921875, 0.352783203125, 0.41064453125, 0.468505859375, 0.5263671875, 0.584228515625, 0.64208984375, 0.699951171875, 0.7578125, 0.815673828125, 0.87353515625, 0.931396484375, 0.9892578125, 1.047119140625, 1.10498046875, 1.162841796875, 1.220703125, 1.278564453125, 1.33642578125, 1.394287109375, 1.4521484375, 1.510009765625, 1.56787109375, 1.625732421875, 1.68359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 11.0, 12.0, 19.0, 30.0, 20.0, 32.0, 49.0, 60.0, 90.0, 161.0, 251.0, 504.0, 1016.0, 784.0, 379.0, 241.0, 114.0, 66.0, 46.0, 38.0, 17.0, 21.0, 18.0, 13.0, 11.0, 13.0, 12.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10009765625, -0.09705257415771484, -0.09400749206542969, -0.09096240997314453, -0.08791732788085938, -0.08487224578857422, -0.08182716369628906, -0.0787820816040039, -0.07573699951171875, -0.0726919174194336, -0.06964683532714844, -0.06660175323486328, -0.06355667114257812, -0.06051158905029297, -0.05746650695800781, -0.054421424865722656, -0.0513763427734375, -0.048331260681152344, -0.04528617858886719, -0.04224109649658203, -0.039196014404296875, -0.03615093231201172, -0.03310585021972656, -0.030060768127441406, -0.02701568603515625, -0.023970603942871094, -0.020925521850585938, -0.01788043975830078, -0.014835357666015625, -0.011790275573730469, -0.008745193481445312, -0.005700111389160156, -0.002655029296875, 0.00039005279541015625, 0.0034351348876953125, 0.006480216979980469, 0.009525299072265625, 0.012570381164550781, 0.015615463256835938, 0.018660545349121094, 0.02170562744140625, 0.024750709533691406, 0.027795791625976562, 0.03084087371826172, 0.033885955810546875, 0.03693103790283203, 0.03997611999511719, 0.043021202087402344, 0.0460662841796875, 0.049111366271972656, 0.05215644836425781, 0.05520153045654297, 0.058246612548828125, 0.06129169464111328, 0.06433677673339844, 0.0673818588256836, 0.07042694091796875, 0.0734720230102539, 0.07651710510253906, 0.07956218719482422, 0.08260726928710938, 0.08565235137939453, 0.08869743347167969, 0.09174251556396484, 0.09478759765625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 13.0, 65.0, 239.0, 405.0, 214.0, 49.0, 16.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.727738857269287, -3.654149293899536, -3.5805599689483643, -3.5069704055786133, -3.4333808422088623, -3.3597915172576904, -3.2862019538879395, -3.2126126289367676, -3.1390230655670166, -3.0654335021972656, -2.9918441772460938, -2.9182546138763428, -2.844665050506592, -2.77107572555542, -2.697486162185669, -2.623896598815918, -2.550307273864746, -2.476717710494995, -2.4031283855438232, -2.3295388221740723, -2.2559492588043213, -2.1823599338531494, -2.1087703704833984, -2.0351810455322266, -1.9615912437438965, -1.888001799583435, -1.814412236213684, -1.7408227920532227, -1.6672333478927612, -1.5936439037322998, -1.5200543403625488, -1.4464648962020874, -1.372875452041626, -1.2992860078811646, -1.2256964445114136, -1.1521070003509521, -1.0785175561904907, -1.0049281120300293, -0.9313385486602783, -0.8577491044998169, -0.7841596603393555, -0.7105701565742493, -0.6369807124137878, -0.5633912086486816, -0.4898017346858978, -0.416212260723114, -0.3426227569580078, -0.2690333127975464, -0.19544380903244019, -0.12185432761907578, -0.048264846205711365, 0.025324642658233643, 0.09891411662101746, 0.17250359058380127, 0.24609309434890747, 0.3196825385093689, 0.3932720422744751, 0.4668615162372589, 0.5404509902000427, 0.6140404939651489, 0.6876299381256104, 0.7612194418907166, 0.8348089456558228, 0.9083983898162842, 0.9819878935813904]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 12.0, 17.0, 15.0, 17.0, 32.0, 31.0, 47.0, 57.0, 55.0, 78.0, 64.0, 64.0, 79.0, 61.0, 65.0, 67.0, 54.0, 42.0, 34.0, 22.0, 12.0, 22.0, 11.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41616570949554443, -0.39932334423065186, -0.38248100876808167, -0.3656386435031891, -0.3487963080406189, -0.3319539427757263, -0.31511157751083374, -0.29826921224594116, -0.28142687678337097, -0.2645845115184784, -0.2477421760559082, -0.23089981079101562, -0.21405746042728424, -0.19721511006355286, -0.18037274479866028, -0.1635303944349289, -0.1466880440711975, -0.12984569370746613, -0.11300333589315414, -0.09616097807884216, -0.07931862771511078, -0.062476277351379395, -0.04563391953706741, -0.028791561722755432, -0.011949211359024048, 0.004893142729997635, 0.021735496819019318, 0.038577850908041, 0.05542020499706268, 0.07226255536079407, 0.08910491317510605, 0.10594727098941803, 0.12278968095779419, 0.13963203132152557, 0.15647438168525696, 0.17331674695014954, 0.19015909731388092, 0.2070014476776123, 0.22384381294250488, 0.24068616330623627, 0.25752851366996765, 0.27437087893486023, 0.2912132143974304, 0.308055579662323, 0.3248979449272156, 0.34174028038978577, 0.35858264565467834, 0.37542498111724854, 0.3922673463821411, 0.4091097116470337, 0.4259520471096039, 0.44279441237449646, 0.45963674783706665, 0.47647911310195923, 0.4933214783668518, 0.5101638436317444, 0.5270061492919922, 0.5438485145568848, 0.5606908798217773, 0.5775331854820251, 0.5943755507469177, 0.6112179160118103, 0.6280602812767029, 0.6449026465415955, 0.661745011806488]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 6.0, 8.0, 9.0, 18.0, 21.0, 29.0, 49.0, 38.0, 55.0, 58.0, 139.0, 1873.0, 491584.0, 552162.0, 2021.0, 161.0, 74.0, 58.0, 35.0, 42.0, 29.0, 22.0, 16.0, 14.0, 8.0, 4.0, 7.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.609375, -2.53265380859375, -2.4559326171875, -2.37921142578125, -2.302490234375, -2.22576904296875, -2.1490478515625, -2.07232666015625, -1.99560546875, -1.91888427734375, -1.8421630859375, -1.76544189453125, -1.688720703125, -1.61199951171875, -1.5352783203125, -1.45855712890625, -1.3818359375, -1.30511474609375, -1.2283935546875, -1.15167236328125, -1.074951171875, -0.99822998046875, -0.9215087890625, -0.84478759765625, -0.76806640625, -0.69134521484375, -0.6146240234375, -0.53790283203125, -0.461181640625, -0.38446044921875, -0.3077392578125, -0.23101806640625, -0.154296875, -0.07757568359375, -0.0008544921875, 0.07586669921875, 0.152587890625, 0.22930908203125, 0.3060302734375, 0.38275146484375, 0.45947265625, 0.53619384765625, 0.6129150390625, 0.68963623046875, 0.766357421875, 0.84307861328125, 0.9197998046875, 0.99652099609375, 1.0732421875, 1.14996337890625, 1.2266845703125, 1.30340576171875, 1.380126953125, 1.45684814453125, 1.5335693359375, 1.61029052734375, 1.68701171875, 1.76373291015625, 1.8404541015625, 1.91717529296875, 1.993896484375, 2.07061767578125, 2.1473388671875, 2.22406005859375, 2.30078125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 10.0, 21.0, 60.0, 82.0, 126.0, 175.0, 171.0, 134.0, 97.0, 64.0, 34.0, 9.0, 8.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042449951171875, -0.03945016860961914, -0.03645038604736328, -0.03345060348510742, -0.030450820922851562, -0.027451038360595703, -0.024451255798339844, -0.021451473236083984, -0.018451690673828125, -0.015451908111572266, -0.012452125549316406, -0.009452342987060547, -0.0064525604248046875, -0.003452777862548828, -0.00045299530029296875, 0.0025467872619628906, 0.00554656982421875, 0.00854635238647461, 0.011546134948730469, 0.014545917510986328, 0.017545700073242188, 0.020545482635498047, 0.023545265197753906, 0.026545047760009766, 0.029544830322265625, 0.032544612884521484, 0.035544395446777344, 0.0385441780090332, 0.04154396057128906, 0.04454374313354492, 0.04754352569580078, 0.05054330825805664, 0.0535430908203125, 0.05654287338256836, 0.05954265594482422, 0.06254243850708008, 0.06554222106933594, 0.0685420036315918, 0.07154178619384766, 0.07454156875610352, 0.07754135131835938, 0.08054113388061523, 0.0835409164428711, 0.08654069900512695, 0.08954048156738281, 0.09254026412963867, 0.09554004669189453, 0.09853982925415039, 0.10153961181640625, 0.10453939437866211, 0.10753917694091797, 0.11053895950317383, 0.11353874206542969, 0.11653852462768555, 0.1195383071899414, 0.12253808975219727, 0.12553787231445312, 0.12853765487670898, 0.13153743743896484, 0.1345372200012207, 0.13753700256347656, 0.14053678512573242, 0.14353656768798828, 0.14653635025024414, 0.1495361328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 2.0, 11.0, 11.0, 15.0, 15.0, 25.0, 33.0, 36.0, 71.0, 112.0, 158.0, 290.0, 437.0, 871.0, 1783.0, 4181.0, 10585.0, 31701.0, 97359.0, 257470.0, 351644.0, 190408.0, 65949.0, 21622.0, 7532.0, 3170.0, 1309.0, 715.0, 369.0, 238.0, 139.0, 80.0, 70.0, 38.0, 33.0, 17.0, 17.0, 5.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.45849609375, -0.4447364807128906, -0.43097686767578125, -0.4172172546386719, -0.4034576416015625, -0.3896980285644531, -0.37593841552734375, -0.3621788024902344, -0.348419189453125, -0.3346595764160156, -0.32089996337890625, -0.3071403503417969, -0.2933807373046875, -0.2796211242675781, -0.26586151123046875, -0.2521018981933594, -0.23834228515625, -0.22458267211914062, -0.21082305908203125, -0.19706344604492188, -0.1833038330078125, -0.16954421997070312, -0.15578460693359375, -0.14202499389648438, -0.128265380859375, -0.11450576782226562, -0.10074615478515625, -0.08698654174804688, -0.0732269287109375, -0.059467315673828125, -0.04570770263671875, -0.031948089599609375, -0.0181884765625, -0.004428863525390625, 0.00933074951171875, 0.023090362548828125, 0.0368499755859375, 0.050609588623046875, 0.06436920166015625, 0.07812881469726562, 0.091888427734375, 0.10564804077148438, 0.11940765380859375, 0.13316726684570312, 0.1469268798828125, 0.16068649291992188, 0.17444610595703125, 0.18820571899414062, 0.20196533203125, 0.21572494506835938, 0.22948455810546875, 0.24324417114257812, 0.2570037841796875, 0.2707633972167969, 0.28452301025390625, 0.2982826232910156, 0.312042236328125, 0.3258018493652344, 0.33956146240234375, 0.3533210754394531, 0.3670806884765625, 0.3808403015136719, 0.39459991455078125, 0.4083595275878906, 0.422119140625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 3.0, 2.0, 6.0, 3.0, 6.0, 7.0, 13.0, 9.0, 26.0, 19.0, 23.0, 28.0, 36.0, 34.0, 32.0, 43.0, 47.0, 55.0, 47.0, 48.0, 53.0, 46.0, 42.0, 45.0, 43.0, 41.0, 30.0, 40.0, 31.0, 24.0, 16.0, 19.0, 21.0, 12.0, 9.0, 6.0, 11.0, 6.0, 8.0, 2.0, 6.0, 0.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2210693359375, -0.21459579467773438, -0.20812225341796875, -0.20164871215820312, -0.1951751708984375, -0.18870162963867188, -0.18222808837890625, -0.17575454711914062, -0.169281005859375, -0.16280746459960938, -0.15633392333984375, -0.14986038208007812, -0.1433868408203125, -0.13691329956054688, -0.13043975830078125, -0.12396621704101562, -0.11749267578125, -0.11101913452148438, -0.10454559326171875, -0.09807205200195312, -0.0915985107421875, -0.08512496948242188, -0.07865142822265625, -0.07217788696289062, -0.065704345703125, -0.059230804443359375, -0.05275726318359375, -0.046283721923828125, -0.0398101806640625, -0.033336639404296875, -0.02686309814453125, -0.020389556884765625, -0.013916015625, -0.007442474365234375, -0.00096893310546875, 0.005504608154296875, 0.0119781494140625, 0.018451690673828125, 0.02492523193359375, 0.031398773193359375, 0.037872314453125, 0.044345855712890625, 0.05081939697265625, 0.057292938232421875, 0.0637664794921875, 0.07024002075195312, 0.07671356201171875, 0.08318710327148438, 0.08966064453125, 0.09613418579101562, 0.10260772705078125, 0.10908126831054688, 0.1155548095703125, 0.12202835083007812, 0.12850189208984375, 0.13497543334960938, 0.141448974609375, 0.14792251586914062, 0.15439605712890625, 0.16086959838867188, 0.1673431396484375, 0.17381668090820312, 0.18029022216796875, 0.18676376342773438, 0.1932373046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 10.0, 3.0, 4.0, 9.0, 8.0, 11.0, 14.0, 18.0, 34.0, 35.0, 63.0, 106.0, 187.0, 329.0, 591.0, 1352.0, 3212.0, 9622.0, 37998.0, 210187.0, 558576.0, 178843.0, 32943.0, 8726.0, 3033.0, 1274.0, 570.0, 322.0, 159.0, 99.0, 56.0, 43.0, 23.0, 37.0, 13.0, 10.0, 10.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.57275390625, -0.555633544921875, -0.53851318359375, -0.521392822265625, -0.5042724609375, -0.487152099609375, -0.47003173828125, -0.452911376953125, -0.435791015625, -0.418670654296875, -0.40155029296875, -0.384429931640625, -0.3673095703125, -0.350189208984375, -0.33306884765625, -0.315948486328125, -0.298828125, -0.281707763671875, -0.26458740234375, -0.247467041015625, -0.2303466796875, -0.213226318359375, -0.19610595703125, -0.178985595703125, -0.161865234375, -0.144744873046875, -0.12762451171875, -0.110504150390625, -0.0933837890625, -0.076263427734375, -0.05914306640625, -0.042022705078125, -0.02490234375, -0.007781982421875, 0.00933837890625, 0.026458740234375, 0.0435791015625, 0.060699462890625, 0.07781982421875, 0.094940185546875, 0.112060546875, 0.129180908203125, 0.14630126953125, 0.163421630859375, 0.1805419921875, 0.197662353515625, 0.21478271484375, 0.231903076171875, 0.2490234375, 0.266143798828125, 0.28326416015625, 0.300384521484375, 0.3175048828125, 0.334625244140625, 0.35174560546875, 0.368865966796875, 0.385986328125, 0.403106689453125, 0.42022705078125, 0.437347412109375, 0.4544677734375, 0.471588134765625, 0.48870849609375, 0.505828857421875, 0.52294921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 11.0, 9.0, 17.0, 22.0, 40.0, 54.0, 82.0, 120.0, 129.0, 137.0, 114.0, 88.0, 53.0, 42.0, 26.0, 18.0, 14.0, 9.0, 7.0, 1.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.508827209472656e-05, -6.214901804924011e-05, -5.920976400375366e-05, -5.627050995826721e-05, -5.333125591278076e-05, -5.039200186729431e-05, -4.745274782180786e-05, -4.451349377632141e-05, -4.157423973083496e-05, -3.863498568534851e-05, -3.569573163986206e-05, -3.275647759437561e-05, -2.981722354888916e-05, -2.687796950340271e-05, -2.393871545791626e-05, -2.099946141242981e-05, -1.806020736694336e-05, -1.512095332145691e-05, -1.2181699275970459e-05, -9.242445230484009e-06, -6.303191184997559e-06, -3.3639371395111084e-06, -4.246830940246582e-07, 2.514570951461792e-06, 5.453824996948242e-06, 8.393079042434692e-06, 1.1332333087921143e-05, 1.4271587133407593e-05, 1.7210841178894043e-05, 2.0150095224380493e-05, 2.3089349269866943e-05, 2.6028603315353394e-05, 2.8967857360839844e-05, 3.1907111406326294e-05, 3.4846365451812744e-05, 3.7785619497299194e-05, 4.0724873542785645e-05, 4.3664127588272095e-05, 4.6603381633758545e-05, 4.9542635679244995e-05, 5.2481889724731445e-05, 5.5421143770217896e-05, 5.8360397815704346e-05, 6.12996518611908e-05, 6.423890590667725e-05, 6.71781599521637e-05, 7.011741399765015e-05, 7.30566680431366e-05, 7.599592208862305e-05, 7.89351761341095e-05, 8.187443017959595e-05, 8.48136842250824e-05, 8.775293827056885e-05, 9.06921923160553e-05, 9.363144636154175e-05, 9.65707004070282e-05, 9.950995445251465e-05, 0.0001024492084980011, 0.00010538846254348755, 0.000108327716588974, 0.00011126697063446045, 0.0001142062246799469, 0.00011714547872543335, 0.0001200847327709198, 0.00012302398681640625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 8.0, 6.0, 15.0, 21.0, 41.0, 46.0, 88.0, 143.0, 228.0, 504.0, 1015.0, 2640.0, 8468.0, 44524.0, 597169.0, 356168.0, 27498.0, 6186.0, 2034.0, 799.0, 406.0, 217.0, 120.0, 68.0, 46.0, 39.0, 17.0, 8.0, 4.0, 6.0, 5.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76220703125, -0.7315750122070312, -0.7009429931640625, -0.6703109741210938, -0.639678955078125, -0.6090469360351562, -0.5784149169921875, -0.5477828979492188, -0.51715087890625, -0.48651885986328125, -0.4558868408203125, -0.42525482177734375, -0.394622802734375, -0.36399078369140625, -0.3333587646484375, -0.30272674560546875, -0.2720947265625, -0.24146270751953125, -0.2108306884765625, -0.18019866943359375, -0.149566650390625, -0.11893463134765625, -0.0883026123046875, -0.05767059326171875, -0.02703857421875, 0.00359344482421875, 0.0342254638671875, 0.06485748291015625, 0.095489501953125, 0.12612152099609375, 0.1567535400390625, 0.18738555908203125, 0.218017578125, 0.24864959716796875, 0.2792816162109375, 0.30991363525390625, 0.340545654296875, 0.37117767333984375, 0.4018096923828125, 0.43244171142578125, 0.46307373046875, 0.49370574951171875, 0.5243377685546875, 0.5549697875976562, 0.585601806640625, 0.6162338256835938, 0.6468658447265625, 0.6774978637695312, 0.7081298828125, 0.7387619018554688, 0.7693939208984375, 0.8000259399414062, 0.830657958984375, 0.8612899780273438, 0.8919219970703125, 0.9225540161132812, 0.95318603515625, 0.9838180541992188, 1.0144500732421875, 1.0450820922851562, 1.075714111328125, 1.1063461303710938, 1.1369781494140625, 1.1676101684570312, 1.1982421875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 4.0, 2.0, 8.0, 15.0, 8.0, 11.0, 19.0, 21.0, 53.0, 76.0, 79.0, 111.0, 132.0, 110.0, 95.0, 83.0, 48.0, 40.0, 21.0, 14.0, 10.0, 9.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.443115234375, -0.43135833740234375, -0.4196014404296875, -0.40784454345703125, -0.396087646484375, -0.38433074951171875, -0.3725738525390625, -0.36081695556640625, -0.34906005859375, -0.33730316162109375, -0.3255462646484375, -0.31378936767578125, -0.302032470703125, -0.29027557373046875, -0.2785186767578125, -0.26676177978515625, -0.2550048828125, -0.24324798583984375, -0.2314910888671875, -0.21973419189453125, -0.207977294921875, -0.19622039794921875, -0.1844635009765625, -0.17270660400390625, -0.16094970703125, -0.14919281005859375, -0.1374359130859375, -0.12567901611328125, -0.113922119140625, -0.10216522216796875, -0.0904083251953125, -0.07865142822265625, -0.06689453125, -0.05513763427734375, -0.0433807373046875, -0.03162384033203125, -0.019866943359375, -0.00811004638671875, 0.0036468505859375, 0.01540374755859375, 0.02716064453125, 0.03891754150390625, 0.0506744384765625, 0.06243133544921875, 0.074188232421875, 0.08594512939453125, 0.0977020263671875, 0.10945892333984375, 0.1212158203125, 0.13297271728515625, 0.1447296142578125, 0.15648651123046875, 0.168243408203125, 0.18000030517578125, 0.1917572021484375, 0.20351409912109375, 0.21527099609375, 0.22702789306640625, 0.2387847900390625, 0.25054168701171875, 0.262298583984375, 0.27405548095703125, 0.2858123779296875, 0.29756927490234375, 0.309326171875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 9.0, 12.0, 30.0, 62.0, 189.0, 315.0, 244.0, 104.0, 24.0, 11.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.983085632324219, -5.730259418487549, -5.477432727813721, -5.224606513977051, -4.971779823303223, -4.718953609466553, -4.466127395629883, -4.213300704956055, -3.9604744911193848, -3.7076480388641357, -3.4548215866088867, -3.201995372772217, -2.9491689205169678, -2.6963424682617188, -2.443516254425049, -2.1906898021698, -1.9378633499145508, -1.6850368976593018, -1.4322105646133423, -1.1793842315673828, -0.9265577793121338, -0.6737313270568848, -0.4209049940109253, -0.16807866096496582, 0.0847477912902832, 0.33757418394088745, 0.5904005765914917, 0.843226969242096, 1.0960533618927002, 1.3488798141479492, 1.6017061471939087, 1.8545324802398682, 2.107358932495117, 2.360185384750366, 2.6130118370056152, 2.865838050842285, 3.118664503097534, 3.371490955352783, 3.624317169189453, 3.877143621444702, 4.129970073699951, 4.382796287536621, 4.635622978210449, 4.888449192047119, 5.141275405883789, 5.394102096557617, 5.646928310394287, 5.899754524230957, 6.152581214904785, 6.405407428741455, 6.658234119415283, 6.911060333251953, 7.163887023925781, 7.416713237762451, 7.669539451599121, 7.922366142272949, 8.175191879272461, 8.428018569946289, 8.6808443069458, 8.933670997619629, 9.186497688293457, 9.439323425292969, 9.692150115966797, 9.944976806640625, 10.197803497314453]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 10.0, 25.0, 57.0, 74.0, 99.0, 139.0, 134.0, 139.0, 115.0, 91.0, 63.0, 38.0, 16.0, 10.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6718108654022217, -1.534712314605713, -1.397613763809204, -1.2605152130126953, -1.1234166622161865, -0.9863181114196777, -0.849219560623169, -0.7121210098266602, -0.5750224590301514, -0.4379239082336426, -0.3008253574371338, -0.163726806640625, -0.02662825584411621, 0.11047029495239258, 0.24756884574890137, 0.38466739654541016, 0.521765947341919, 0.6588644981384277, 0.7959630489349365, 0.9330615997314453, 1.070160150527954, 1.207258701324463, 1.3443572521209717, 1.4814558029174805, 1.6185543537139893, 1.755652904510498, 1.8927514553070068, 2.0298500061035156, 2.1669485569000244, 2.304047107696533, 2.441145658493042, 2.578244209289551, 2.7153429985046387, 2.8524415493011475, 2.9895401000976562, 3.126638650894165, 3.263737201690674, 3.4008357524871826, 3.5379343032836914, 3.6750328540802, 3.812131404876709, 3.9492299556732178, 4.086328506469727, 4.223426818847656, 4.360525608062744, 4.497624397277832, 4.634722709655762, 4.771821022033691, 4.908919811248779, 5.046018600463867, 5.183116912841797, 5.320215225219727, 5.4573140144348145, 5.594412803649902, 5.731511116027832, 5.868609428405762, 6.00570821762085, 6.1428070068359375, 6.279905319213867, 6.417003631591797, 6.554102420806885, 6.691201210021973, 6.828299522399902, 6.965397834777832, 7.10249662399292]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 14.0, 22.0, 72.0, 167.0, 691.0, 17208.0, 4157771.0, 16905.0, 775.0, 243.0, 116.0, 79.0, 40.0, 33.0, 39.0, 25.0, 22.0, 16.0, 12.0, 8.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17578125, -3.02093505859375, -2.8660888671875, -2.71124267578125, -2.556396484375, -2.40155029296875, -2.2467041015625, -2.09185791015625, -1.93701171875, -1.78216552734375, -1.6273193359375, -1.47247314453125, -1.317626953125, -1.16278076171875, -1.0079345703125, -0.85308837890625, -0.6982421875, -0.54339599609375, -0.3885498046875, -0.23370361328125, -0.078857421875, 0.07598876953125, 0.2308349609375, 0.38568115234375, 0.54052734375, 0.69537353515625, 0.8502197265625, 1.00506591796875, 1.159912109375, 1.31475830078125, 1.4696044921875, 1.62445068359375, 1.779296875, 1.93414306640625, 2.0889892578125, 2.24383544921875, 2.398681640625, 2.55352783203125, 2.7083740234375, 2.86322021484375, 3.01806640625, 3.17291259765625, 3.3277587890625, 3.48260498046875, 3.637451171875, 3.79229736328125, 3.9471435546875, 4.10198974609375, 4.2568359375, 4.41168212890625, 4.5665283203125, 4.72137451171875, 4.876220703125, 5.03106689453125, 5.1859130859375, 5.34075927734375, 5.49560546875, 5.65045166015625, 5.8052978515625, 5.96014404296875, 6.114990234375, 6.26983642578125, 6.4246826171875, 6.57952880859375, 6.734375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 11.0, 16.0, 44.0, 67.0, 99.0, 186.0, 167.0, 157.0, 121.0, 76.0, 33.0, 17.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083984375, -0.07967758178710938, -0.07537078857421875, -0.07106399536132812, -0.0667572021484375, -0.062450408935546875, -0.05814361572265625, -0.053836822509765625, -0.049530029296875, -0.045223236083984375, -0.04091644287109375, -0.036609649658203125, -0.0323028564453125, -0.027996063232421875, -0.02368927001953125, -0.019382476806640625, -0.01507568359375, -0.010768890380859375, -0.00646209716796875, -0.002155303955078125, 0.0021514892578125, 0.006458282470703125, 0.01076507568359375, 0.015071868896484375, 0.019378662109375, 0.023685455322265625, 0.02799224853515625, 0.032299041748046875, 0.0366058349609375, 0.040912628173828125, 0.04521942138671875, 0.049526214599609375, 0.0538330078125, 0.058139801025390625, 0.06244659423828125, 0.06675338745117188, 0.0710601806640625, 0.07536697387695312, 0.07967376708984375, 0.08398056030273438, 0.088287353515625, 0.09259414672851562, 0.09690093994140625, 0.10120773315429688, 0.1055145263671875, 0.10982131958007812, 0.11412811279296875, 0.11843490600585938, 0.12274169921875, 0.12704849243164062, 0.13135528564453125, 0.13566207885742188, 0.1399688720703125, 0.14427566528320312, 0.14858245849609375, 0.15288925170898438, 0.157196044921875, 0.16150283813476562, 0.16580963134765625, 0.17011642456054688, 0.1744232177734375, 0.17873001098632812, 0.18303680419921875, 0.18734359741210938, 0.191650390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 9.0, 11.0, 9.0, 22.0, 33.0, 66.0, 120.0, 165.0, 343.0, 792.0, 6083.0, 4030038.0, 153601.0, 1913.0, 520.0, 249.0, 148.0, 75.0, 41.0, 27.0, 14.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.0546875, -7.889678955078125, -7.72467041015625, -7.559661865234375, -7.3946533203125, -7.229644775390625, -7.06463623046875, -6.899627685546875, -6.734619140625, -6.569610595703125, -6.40460205078125, -6.239593505859375, -6.0745849609375, -5.909576416015625, -5.74456787109375, -5.579559326171875, -5.41455078125, -5.249542236328125, -5.08453369140625, -4.919525146484375, -4.7545166015625, -4.589508056640625, -4.42449951171875, -4.259490966796875, -4.094482421875, -3.929473876953125, -3.76446533203125, -3.599456787109375, -3.4344482421875, -3.269439697265625, -3.10443115234375, -2.939422607421875, -2.7744140625, -2.609405517578125, -2.44439697265625, -2.279388427734375, -2.1143798828125, -1.949371337890625, -1.78436279296875, -1.619354248046875, -1.454345703125, -1.289337158203125, -1.12432861328125, -0.959320068359375, -0.7943115234375, -0.629302978515625, -0.46429443359375, -0.299285888671875, -0.13427734375, 0.030731201171875, 0.19573974609375, 0.360748291015625, 0.5257568359375, 0.690765380859375, 0.85577392578125, 1.020782470703125, 1.185791015625, 1.350799560546875, 1.51580810546875, 1.680816650390625, 1.8458251953125, 2.010833740234375, 2.17584228515625, 2.340850830078125, 2.505859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 11.0, 10.0, 29.0, 44.0, 120.0, 459.0, 2543.0, 630.0, 151.0, 53.0, 26.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7080078125, -0.6928024291992188, -0.6775970458984375, -0.6623916625976562, -0.647186279296875, -0.6319808959960938, -0.6167755126953125, -0.6015701293945312, -0.58636474609375, -0.5711593627929688, -0.5559539794921875, -0.5407485961914062, -0.525543212890625, -0.5103378295898438, -0.4951324462890625, -0.47992706298828125, -0.4647216796875, -0.44951629638671875, -0.4343109130859375, -0.41910552978515625, -0.403900146484375, -0.38869476318359375, -0.3734893798828125, -0.35828399658203125, -0.34307861328125, -0.32787322998046875, -0.3126678466796875, -0.29746246337890625, -0.282257080078125, -0.26705169677734375, -0.2518463134765625, -0.23664093017578125, -0.221435546875, -0.20623016357421875, -0.1910247802734375, -0.17581939697265625, -0.160614013671875, -0.14540863037109375, -0.1302032470703125, -0.11499786376953125, -0.09979248046875, -0.08458709716796875, -0.0693817138671875, -0.05417633056640625, -0.038970947265625, -0.02376556396484375, -0.0085601806640625, 0.00664520263671875, 0.0218505859375, 0.03705596923828125, 0.0522613525390625, 0.06746673583984375, 0.082672119140625, 0.09787750244140625, 0.1130828857421875, 0.12828826904296875, 0.14349365234375, 0.15869903564453125, 0.1739044189453125, 0.18910980224609375, 0.204315185546875, 0.21952056884765625, 0.2347259521484375, 0.24993133544921875, 0.26513671875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 28.0, 125.0, 452.0, 320.0, 61.0, 14.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.045211791992188, -9.825933456420898, -9.60665512084961, -9.387377738952637, -9.168099403381348, -8.948821067810059, -8.72954273223877, -8.51026439666748, -8.290987014770508, -8.071708679199219, -7.852430820465088, -7.633152484893799, -7.413874626159668, -7.194596290588379, -6.97531795501709, -6.756040096282959, -6.536761283874512, -6.317482948303223, -6.098205089569092, -5.878926753997803, -5.659648895263672, -5.440370559692383, -5.221092224121094, -5.001814365386963, -4.782536506652832, -4.563258171081543, -4.343980312347412, -4.124701976776123, -3.905423879623413, -3.686145782470703, -3.466867685317993, -3.247589588165283, -3.0283114910125732, -2.8090333938598633, -2.5897552967071533, -2.3704771995544434, -2.1511988639831543, -1.9319207668304443, -1.7126426696777344, -1.4933644533157349, -1.274086356163025, -1.054808259010315, -0.8355300426483154, -0.6162519454956055, -0.39697378873825073, -0.177695631980896, 0.041582465171813965, 0.2608606815338135, 0.48013877868652344, 0.6994169354438782, 0.9186950922012329, 1.1379731893539429, 1.3572514057159424, 1.5765295028686523, 1.7958076000213623, 2.0150856971740723, 2.2343640327453613, 2.4536421298980713, 2.6729202270507812, 2.8921985626220703, 3.1114766597747803, 3.3307547569274902, 3.5500328540802, 3.76931095123291, 3.98858904838562]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 19.0, 22.0, 41.0, 44.0, 68.0, 70.0, 95.0, 118.0, 106.0, 108.0, 93.0, 63.0, 51.0, 39.0, 24.0, 15.0, 10.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1679043769836426, -1.1115180253982544, -1.0551316738128662, -0.9987452626228333, -0.9423588514328003, -0.8859724998474121, -0.8295861482620239, -0.773199737071991, -0.716813325881958, -0.6604269742965698, -0.6040405631065369, -0.5476542115211487, -0.4912678003311157, -0.43488144874572754, -0.37849506735801697, -0.3221086859703064, -0.2657223343849182, -0.20933595299720764, -0.15294957160949707, -0.09656320512294769, -0.04017682373523712, 0.016209542751312256, 0.07259592413902283, 0.1289823055267334, 0.18536868691444397, 0.24175506830215454, 0.2981414496898651, 0.3545278310775757, 0.41091418266296387, 0.46730056405067444, 0.523686945438385, 0.580073356628418, 0.6364597082138062, 0.6928460597991943, 0.7492324709892273, 0.8056188225746155, 0.8620052337646484, 0.9183915853500366, 0.9747779369354248, 1.0311644077301025, 1.0875507593154907, 1.143937110900879, 1.200323462486267, 1.2567099332809448, 1.313096284866333, 1.3694826364517212, 1.4258689880371094, 1.482255458831787, 1.5386416912078857, 1.595028042793274, 1.651414394378662, 1.7078008651733398, 1.764187216758728, 1.8205735683441162, 1.8769599199295044, 1.9333462715148926, 1.9897327423095703, 2.046119213104248, 2.1025054454803467, 2.1588919162750244, 2.215278148651123, 2.271664619445801, 2.3280510902404785, 2.384437322616577, 2.440823793411255]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 10.0, 10.0, 18.0, 9.0, 12.0, 20.0, 38.0, 51.0, 71.0, 127.0, 243.0, 599.0, 1860.0, 11883.0, 250595.0, 734294.0, 42759.0, 4026.0, 995.0, 385.0, 186.0, 107.0, 57.0, 49.0, 29.0, 19.0, 16.0, 9.0, 14.0, 12.0, 11.0, 10.0, 9.0, 1.0, 3.0, 1.0, 5.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.378662109375, -1.32177734375, -1.264892578125, -1.2080078125, -1.151123046875, -1.09423828125, -1.037353515625, -0.98046875, -0.923583984375, -0.86669921875, -0.809814453125, -0.7529296875, -0.696044921875, -0.63916015625, -0.582275390625, -0.525390625, -0.468505859375, -0.41162109375, -0.354736328125, -0.2978515625, -0.240966796875, -0.18408203125, -0.127197265625, -0.0703125, -0.013427734375, 0.04345703125, 0.100341796875, 0.1572265625, 0.214111328125, 0.27099609375, 0.327880859375, 0.384765625, 0.441650390625, 0.49853515625, 0.555419921875, 0.6123046875, 0.669189453125, 0.72607421875, 0.782958984375, 0.83984375, 0.896728515625, 0.95361328125, 1.010498046875, 1.0673828125, 1.124267578125, 1.18115234375, 1.238037109375, 1.294921875, 1.351806640625, 1.40869140625, 1.465576171875, 1.5224609375, 1.579345703125, 1.63623046875, 1.693115234375, 1.75, 1.806884765625, 1.86376953125, 1.920654296875, 1.9775390625, 2.034423828125, 2.09130859375, 2.148193359375, 2.205078125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 13.0, 23.0, 36.0, 49.0, 82.0, 95.0, 118.0, 119.0, 119.0, 101.0, 85.0, 64.0, 41.0, 20.0, 14.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11602783203125, -0.11210155487060547, -0.10817527770996094, -0.1042490005493164, -0.10032272338867188, -0.09639644622802734, -0.09247016906738281, -0.08854389190673828, -0.08461761474609375, -0.08069133758544922, -0.07676506042480469, -0.07283878326416016, -0.06891250610351562, -0.0649862289428711, -0.06105995178222656, -0.05713367462158203, -0.0532073974609375, -0.04928112030029297, -0.04535484313964844, -0.041428565979003906, -0.037502288818359375, -0.033576011657714844, -0.029649734497070312, -0.02572345733642578, -0.02179718017578125, -0.01787090301513672, -0.013944625854492188, -0.010018348693847656, -0.006092071533203125, -0.0021657943725585938, 0.0017604827880859375, 0.005686759948730469, 0.009613037109375, 0.013539314270019531, 0.017465591430664062, 0.021391868591308594, 0.025318145751953125, 0.029244422912597656, 0.03317070007324219, 0.03709697723388672, 0.04102325439453125, 0.04494953155517578, 0.04887580871582031, 0.052802085876464844, 0.056728363037109375, 0.060654640197753906, 0.06458091735839844, 0.06850719451904297, 0.0724334716796875, 0.07635974884033203, 0.08028602600097656, 0.0842123031616211, 0.08813858032226562, 0.09206485748291016, 0.09599113464355469, 0.09991741180419922, 0.10384368896484375, 0.10776996612548828, 0.11169624328613281, 0.11562252044677734, 0.11954879760742188, 0.1234750747680664, 0.12740135192871094, 0.13132762908935547, 0.13525390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 3.0, 5.0, 16.0, 21.0, 15.0, 28.0, 36.0, 56.0, 86.0, 119.0, 191.0, 340.0, 612.0, 1216.0, 2620.0, 7358.0, 26284.0, 117106.0, 422931.0, 353565.0, 86005.0, 19475.0, 5851.0, 2275.0, 1008.0, 487.0, 289.0, 176.0, 124.0, 79.0, 45.0, 27.0, 31.0, 18.0, 16.0, 9.0, 10.0, 3.0, 5.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0], "bins": [-0.80615234375, -0.784881591796875, -0.76361083984375, -0.742340087890625, -0.7210693359375, -0.699798583984375, -0.67852783203125, -0.657257080078125, -0.635986328125, -0.614715576171875, -0.59344482421875, -0.572174072265625, -0.5509033203125, -0.529632568359375, -0.50836181640625, -0.487091064453125, -0.4658203125, -0.444549560546875, -0.42327880859375, -0.402008056640625, -0.3807373046875, -0.359466552734375, -0.33819580078125, -0.316925048828125, -0.295654296875, -0.274383544921875, -0.25311279296875, -0.231842041015625, -0.2105712890625, -0.189300537109375, -0.16802978515625, -0.146759033203125, -0.12548828125, -0.104217529296875, -0.08294677734375, -0.061676025390625, -0.0404052734375, -0.019134521484375, 0.00213623046875, 0.023406982421875, 0.044677734375, 0.065948486328125, 0.08721923828125, 0.108489990234375, 0.1297607421875, 0.151031494140625, 0.17230224609375, 0.193572998046875, 0.21484375, 0.236114501953125, 0.25738525390625, 0.278656005859375, 0.2999267578125, 0.321197509765625, 0.34246826171875, 0.363739013671875, 0.385009765625, 0.406280517578125, 0.42755126953125, 0.448822021484375, 0.4700927734375, 0.491363525390625, 0.51263427734375, 0.533905029296875, 0.55517578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 13.0, 8.0, 11.0, 14.0, 15.0, 26.0, 25.0, 30.0, 35.0, 36.0, 35.0, 54.0, 56.0, 59.0, 59.0, 59.0, 52.0, 55.0, 55.0, 49.0, 36.0, 39.0, 28.0, 25.0, 29.0, 20.0, 15.0, 17.0, 10.0, 6.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.37890625, -0.3684959411621094, -0.35808563232421875, -0.3476753234863281, -0.3372650146484375, -0.3268547058105469, -0.31644439697265625, -0.3060340881347656, -0.295623779296875, -0.2852134704589844, -0.27480316162109375, -0.2643928527832031, -0.2539825439453125, -0.24357223510742188, -0.23316192626953125, -0.22275161743164062, -0.21234130859375, -0.20193099975585938, -0.19152069091796875, -0.18111038208007812, -0.1707000732421875, -0.16028976440429688, -0.14987945556640625, -0.13946914672851562, -0.129058837890625, -0.11864852905273438, -0.10823822021484375, -0.09782791137695312, -0.0874176025390625, -0.07700729370117188, -0.06659698486328125, -0.056186676025390625, -0.0457763671875, -0.035366058349609375, -0.02495574951171875, -0.014545440673828125, -0.0041351318359375, 0.006275177001953125, 0.01668548583984375, 0.027095794677734375, 0.037506103515625, 0.047916412353515625, 0.05832672119140625, 0.06873703002929688, 0.0791473388671875, 0.08955764770507812, 0.09996795654296875, 0.11037826538085938, 0.12078857421875, 0.13119888305664062, 0.14160919189453125, 0.15201950073242188, 0.1624298095703125, 0.17284011840820312, 0.18325042724609375, 0.19366073608398438, 0.204071044921875, 0.21448135375976562, 0.22489166259765625, 0.23530197143554688, 0.2457122802734375, 0.2561225891113281, 0.26653289794921875, 0.2769432067871094, 0.287353515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 9.0, 15.0, 13.0, 26.0, 54.0, 73.0, 105.0, 213.0, 419.0, 1348.0, 6075.0, 68038.0, 928777.0, 36896.0, 4526.0, 1046.0, 382.0, 192.0, 109.0, 73.0, 54.0, 28.0, 17.0, 14.0, 9.0, 10.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6630859375, -1.613311767578125, -1.56353759765625, -1.513763427734375, -1.4639892578125, -1.414215087890625, -1.36444091796875, -1.314666748046875, -1.264892578125, -1.215118408203125, -1.16534423828125, -1.115570068359375, -1.0657958984375, -1.016021728515625, -0.96624755859375, -0.916473388671875, -0.86669921875, -0.816925048828125, -0.76715087890625, -0.717376708984375, -0.6676025390625, -0.617828369140625, -0.56805419921875, -0.518280029296875, -0.468505859375, -0.418731689453125, -0.36895751953125, -0.319183349609375, -0.2694091796875, -0.219635009765625, -0.16986083984375, -0.120086669921875, -0.0703125, -0.020538330078125, 0.02923583984375, 0.079010009765625, 0.1287841796875, 0.178558349609375, 0.22833251953125, 0.278106689453125, 0.327880859375, 0.377655029296875, 0.42742919921875, 0.477203369140625, 0.5269775390625, 0.576751708984375, 0.62652587890625, 0.676300048828125, 0.72607421875, 0.775848388671875, 0.82562255859375, 0.875396728515625, 0.9251708984375, 0.974945068359375, 1.02471923828125, 1.074493408203125, 1.124267578125, 1.174041748046875, 1.22381591796875, 1.273590087890625, 1.3233642578125, 1.373138427734375, 1.42291259765625, 1.472686767578125, 1.5224609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 3.0, 2.0, 6.0, 12.0, 22.0, 32.0, 53.0, 57.0, 95.0, 99.0, 134.0, 125.0, 101.0, 83.0, 59.0, 35.0, 28.0, 10.0, 13.0, 12.0, 8.0, 2.0, 5.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.842613220214844e-05, -6.528012454509735e-05, -6.213411688804626e-05, -5.898810923099518e-05, -5.584210157394409e-05, -5.2696093916893005e-05, -4.955008625984192e-05, -4.640407860279083e-05, -4.3258070945739746e-05, -4.011206328868866e-05, -3.696605563163757e-05, -3.382004797458649e-05, -3.06740403175354e-05, -2.7528032660484314e-05, -2.4382025003433228e-05, -2.123601734638214e-05, -1.8090009689331055e-05, -1.4944002032279968e-05, -1.1797994375228882e-05, -8.651986718177795e-06, -5.505979061126709e-06, -2.3599714040756226e-06, 7.860362529754639e-07, 3.93204391002655e-06, 7.078051567077637e-06, 1.0224059224128723e-05, 1.337006688117981e-05, 1.6516074538230896e-05, 1.9662082195281982e-05, 2.280808985233307e-05, 2.5954097509384155e-05, 2.9100105166435242e-05, 3.224611282348633e-05, 3.5392120480537415e-05, 3.85381281375885e-05, 4.168413579463959e-05, 4.4830143451690674e-05, 4.797615110874176e-05, 5.112215876579285e-05, 5.426816642284393e-05, 5.741417407989502e-05, 6.0560181736946106e-05, 6.370618939399719e-05, 6.685219705104828e-05, 6.999820470809937e-05, 7.314421236515045e-05, 7.629022002220154e-05, 7.943622767925262e-05, 8.258223533630371e-05, 8.57282429933548e-05, 8.887425065040588e-05, 9.202025830745697e-05, 9.516626596450806e-05, 9.831227362155914e-05, 0.00010145828127861023, 0.00010460428893566132, 0.0001077502965927124, 0.00011089630424976349, 0.00011404231190681458, 0.00011718831956386566, 0.00012033432722091675, 0.00012348033487796783, 0.00012662634253501892, 0.00012977235019207, 0.0001329183578491211]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 7.0, 5.0, 17.0, 29.0, 47.0, 68.0, 120.0, 247.0, 645.0, 1671.0, 6345.0, 45543.0, 856796.0, 123088.0, 10011.0, 2335.0, 833.0, 314.0, 171.0, 90.0, 53.0, 39.0, 20.0, 16.0, 9.0, 8.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.2192840576171875, -1.180755615234375, -1.1422271728515625, -1.10369873046875, -1.0651702880859375, -1.026641845703125, -0.9881134033203125, -0.9495849609375, -0.9110565185546875, -0.872528076171875, -0.8339996337890625, -0.79547119140625, -0.7569427490234375, -0.718414306640625, -0.6798858642578125, -0.641357421875, -0.6028289794921875, -0.564300537109375, -0.5257720947265625, -0.48724365234375, -0.4487152099609375, -0.410186767578125, -0.3716583251953125, -0.3331298828125, -0.2946014404296875, -0.256072998046875, -0.2175445556640625, -0.17901611328125, -0.1404876708984375, -0.101959228515625, -0.0634307861328125, -0.02490234375, 0.0136260986328125, 0.052154541015625, 0.0906829833984375, 0.12921142578125, 0.1677398681640625, 0.206268310546875, 0.2447967529296875, 0.2833251953125, 0.3218536376953125, 0.360382080078125, 0.3989105224609375, 0.43743896484375, 0.4759674072265625, 0.514495849609375, 0.5530242919921875, 0.591552734375, 0.6300811767578125, 0.668609619140625, 0.7071380615234375, 0.74566650390625, 0.7841949462890625, 0.822723388671875, 0.8612518310546875, 0.8997802734375, 0.9383087158203125, 0.976837158203125, 1.0153656005859375, 1.05389404296875, 1.0924224853515625, 1.130950927734375, 1.1694793701171875, 1.2080078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 7.0, 8.0, 15.0, 14.0, 32.0, 69.0, 83.0, 138.0, 165.0, 153.0, 125.0, 72.0, 52.0, 22.0, 13.0, 8.0, 3.0, 6.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.430908203125, -0.4154930114746094, -0.40007781982421875, -0.3846626281738281, -0.3692474365234375, -0.3538322448730469, -0.33841705322265625, -0.3230018615722656, -0.307586669921875, -0.2921714782714844, -0.27675628662109375, -0.2613410949707031, -0.2459259033203125, -0.23051071166992188, -0.21509552001953125, -0.19968032836914062, -0.18426513671875, -0.16884994506835938, -0.15343475341796875, -0.13801956176757812, -0.1226043701171875, -0.10718917846679688, -0.09177398681640625, -0.07635879516601562, -0.060943603515625, -0.045528411865234375, -0.03011322021484375, -0.014698028564453125, 0.0007171630859375, 0.016132354736328125, 0.03154754638671875, 0.046962738037109375, 0.0623779296875, 0.07779312133789062, 0.09320831298828125, 0.10862350463867188, 0.1240386962890625, 0.13945388793945312, 0.15486907958984375, 0.17028427124023438, 0.185699462890625, 0.20111465454101562, 0.21652984619140625, 0.23194503784179688, 0.2473602294921875, 0.2627754211425781, 0.27819061279296875, 0.2936058044433594, 0.30902099609375, 0.3244361877441406, 0.33985137939453125, 0.3552665710449219, 0.3706817626953125, 0.3860969543457031, 0.40151214599609375, 0.4169273376464844, 0.432342529296875, 0.4477577209472656, 0.46317291259765625, 0.4785881042480469, 0.4940032958984375, 0.5094184875488281, 0.5248336791992188, 0.5402488708496094, 0.5556640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 12.0, 46.0, 184.0, 423.0, 250.0, 67.0, 17.0, 10.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.70760726928711, -16.33279037475586, -15.957975387573242, -15.583159446716309, -15.208343505859375, -14.833527565002441, -14.458711624145508, -14.083895683288574, -13.70907974243164, -13.334263801574707, -12.959447860717773, -12.58463191986084, -12.209815979003906, -11.835000038146973, -11.460184097290039, -11.085368156433105, -10.710552215576172, -10.335736274719238, -9.960920333862305, -9.586104393005371, -9.211288452148438, -8.836472511291504, -8.46165657043457, -8.086840629577637, -7.712023735046387, -7.337207794189453, -6.9623918533325195, -6.587575912475586, -6.212759971618652, -5.837944030761719, -5.463128089904785, -5.088312149047852, -4.71349573135376, -4.338679790496826, -3.9638638496398926, -3.589047908782959, -3.2142319679260254, -2.839416027069092, -2.464599847793579, -2.0897839069366455, -1.714967966079712, -1.3401520252227783, -0.9653360247612, -0.5905200242996216, -0.215704083442688, 0.1591118574142456, 0.5339279174804688, 0.9087438583374023, 1.283559799194336, 1.6583757400512695, 2.033191680908203, 2.4080076217651367, 2.7828235626220703, 3.157639503479004, 3.5324556827545166, 3.90727162361145, 4.282087326049805, 4.656903266906738, 5.031719207763672, 5.4065351486206055, 5.781351089477539, 6.156167030334473, 6.530982971191406, 6.90579891204834, 7.280615329742432]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 14.0, 18.0, 17.0, 31.0, 34.0, 42.0, 46.0, 69.0, 69.0, 62.0, 65.0, 65.0, 82.0, 67.0, 54.0, 59.0, 43.0, 40.0, 34.0, 21.0, 17.0, 6.0, 15.0, 10.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.159533977508545, -2.0684778690338135, -1.9774218797683716, -1.8863658905029297, -1.7953099012374878, -1.704253911972046, -1.6131978034973145, -1.5221418142318726, -1.4310858249664307, -1.3400298357009888, -1.2489737272262573, -1.1579177379608154, -1.0668617486953735, -0.9758056998252869, -0.8847496509552002, -0.7936936616897583, -0.7026375532150269, -0.6115815043449402, -0.5205255150794983, -0.4294694662094116, -0.33841344714164734, -0.24735742807388306, -0.1563013792037964, -0.06524538993835449, 0.025810658931732178, 0.11686668545007706, 0.20792271196842194, 0.2989787459373474, 0.3900347650051117, 0.481090784072876, 0.5721468329429626, 0.6632028222084045, 0.7542588710784912, 0.8453149199485779, 0.9363709092140198, 1.0274269580841064, 1.1184829473495483, 1.2095389366149902, 1.3005950450897217, 1.3916510343551636, 1.4827070236206055, 1.5737630128860474, 1.6648191213607788, 1.7558751106262207, 1.8469310998916626, 1.9379870891571045, 2.029043197631836, 2.1200990676879883, 2.211155414581299, 2.3022115230560303, 2.3932673931121826, 2.484323501586914, 2.5753796100616455, 2.666435480117798, 2.7574915885925293, 2.8485474586486816, 2.939603567123413, 3.0306596755981445, 3.121715545654297, 3.2127716541290283, 3.3038277626037598, 3.394883632659912, 3.4859397411346436, 3.576995849609375, 3.6680517196655273]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 11.0, 12.0, 18.0, 32.0, 52.0, 99.0, 295.0, 999.0, 6401.0, 97757.0, 3993691.0, 87454.0, 5839.0, 962.0, 270.0, 118.0, 66.0, 42.0, 28.0, 22.0, 22.0, 19.0, 7.0, 11.0, 14.0, 5.0, 2.0, 4.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9638671875, -1.8897247314453125, -1.815582275390625, -1.7414398193359375, -1.66729736328125, -1.5931549072265625, -1.519012451171875, -1.4448699951171875, -1.3707275390625, -1.2965850830078125, -1.222442626953125, -1.1483001708984375, -1.07415771484375, -1.0000152587890625, -0.925872802734375, -0.8517303466796875, -0.777587890625, -0.7034454345703125, -0.629302978515625, -0.5551605224609375, -0.48101806640625, -0.4068756103515625, -0.332733154296875, -0.2585906982421875, -0.1844482421875, -0.1103057861328125, -0.036163330078125, 0.0379791259765625, 0.11212158203125, 0.1862640380859375, 0.260406494140625, 0.3345489501953125, 0.40869140625, 0.4828338623046875, 0.556976318359375, 0.6311187744140625, 0.70526123046875, 0.7794036865234375, 0.853546142578125, 0.9276885986328125, 1.0018310546875, 1.0759735107421875, 1.150115966796875, 1.2242584228515625, 1.29840087890625, 1.3725433349609375, 1.446685791015625, 1.5208282470703125, 1.594970703125, 1.6691131591796875, 1.743255615234375, 1.8173980712890625, 1.89154052734375, 1.9656829833984375, 2.039825439453125, 2.1139678955078125, 2.1881103515625, 2.2622528076171875, 2.336395263671875, 2.4105377197265625, 2.48468017578125, 2.5588226318359375, 2.632965087890625, 2.7071075439453125, 2.78125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 6.0, 6.0, 9.0, 14.0, 10.0, 18.0, 15.0, 35.0, 37.0, 42.0, 53.0, 45.0, 51.0, 67.0, 48.0, 68.0, 69.0, 65.0, 74.0, 63.0, 43.0, 27.0, 34.0, 27.0, 17.0, 14.0, 10.0, 9.0, 9.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063232421875, -0.06072998046875, -0.0582275390625, -0.05572509765625, -0.05322265625, -0.05072021484375, -0.0482177734375, -0.04571533203125, -0.043212890625, -0.04071044921875, -0.0382080078125, -0.03570556640625, -0.033203125, -0.03070068359375, -0.0281982421875, -0.02569580078125, -0.023193359375, -0.02069091796875, -0.0181884765625, -0.01568603515625, -0.01318359375, -0.01068115234375, -0.0081787109375, -0.00567626953125, -0.003173828125, -0.00067138671875, 0.0018310546875, 0.00433349609375, 0.0068359375, 0.00933837890625, 0.0118408203125, 0.01434326171875, 0.016845703125, 0.01934814453125, 0.0218505859375, 0.02435302734375, 0.02685546875, 0.02935791015625, 0.0318603515625, 0.03436279296875, 0.036865234375, 0.03936767578125, 0.0418701171875, 0.04437255859375, 0.046875, 0.04937744140625, 0.0518798828125, 0.05438232421875, 0.056884765625, 0.05938720703125, 0.0618896484375, 0.06439208984375, 0.06689453125, 0.06939697265625, 0.0718994140625, 0.07440185546875, 0.076904296875, 0.07940673828125, 0.0819091796875, 0.08441162109375, 0.0869140625, 0.08941650390625, 0.0919189453125, 0.09442138671875, 0.096923828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 9.0, 8.0, 14.0, 28.0, 19.0, 38.0, 67.0, 129.0, 238.0, 505.0, 1730.0, 44189.0, 4138750.0, 6616.0, 1036.0, 410.0, 185.0, 105.0, 69.0, 53.0, 27.0, 16.0, 7.0, 10.0, 8.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.125, -6.9525146484375, -6.780029296875, -6.6075439453125, -6.43505859375, -6.2625732421875, -6.090087890625, -5.9176025390625, -5.7451171875, -5.5726318359375, -5.400146484375, -5.2276611328125, -5.05517578125, -4.8826904296875, -4.710205078125, -4.5377197265625, -4.365234375, -4.1927490234375, -4.020263671875, -3.8477783203125, -3.67529296875, -3.5028076171875, -3.330322265625, -3.1578369140625, -2.9853515625, -2.8128662109375, -2.640380859375, -2.4678955078125, -2.29541015625, -2.1229248046875, -1.950439453125, -1.7779541015625, -1.60546875, -1.4329833984375, -1.260498046875, -1.0880126953125, -0.91552734375, -0.7430419921875, -0.570556640625, -0.3980712890625, -0.2255859375, -0.0531005859375, 0.119384765625, 0.2918701171875, 0.46435546875, 0.6368408203125, 0.809326171875, 0.9818115234375, 1.154296875, 1.3267822265625, 1.499267578125, 1.6717529296875, 1.84423828125, 2.0167236328125, 2.189208984375, 2.3616943359375, 2.5341796875, 2.7066650390625, 2.879150390625, 3.0516357421875, 3.22412109375, 3.3966064453125, 3.569091796875, 3.7415771484375, 3.9140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 12.0, 16.0, 17.0, 40.0, 106.0, 252.0, 840.0, 2039.0, 434.0, 161.0, 78.0, 28.0, 21.0, 14.0, 11.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41455078125, -0.4020957946777344, -0.38964080810546875, -0.3771858215332031, -0.3647308349609375, -0.3522758483886719, -0.33982086181640625, -0.3273658752441406, -0.314910888671875, -0.3024559020996094, -0.29000091552734375, -0.2775459289550781, -0.2650909423828125, -0.2526359558105469, -0.24018096923828125, -0.22772598266601562, -0.21527099609375, -0.20281600952148438, -0.19036102294921875, -0.17790603637695312, -0.1654510498046875, -0.15299606323242188, -0.14054107666015625, -0.12808609008789062, -0.115631103515625, -0.10317611694335938, -0.09072113037109375, -0.07826614379882812, -0.0658111572265625, -0.053356170654296875, -0.04090118408203125, -0.028446197509765625, -0.0159912109375, -0.003536224365234375, 0.00891876220703125, 0.021373748779296875, 0.0338287353515625, 0.046283721923828125, 0.05873870849609375, 0.07119369506835938, 0.083648681640625, 0.09610366821289062, 0.10855865478515625, 0.12101364135742188, 0.1334686279296875, 0.14592361450195312, 0.15837860107421875, 0.17083358764648438, 0.18328857421875, 0.19574356079101562, 0.20819854736328125, 0.22065353393554688, 0.2331085205078125, 0.24556350708007812, 0.25801849365234375, 0.2704734802246094, 0.282928466796875, 0.2953834533691406, 0.30783843994140625, 0.3202934265136719, 0.3327484130859375, 0.3452033996582031, 0.35765838623046875, 0.3701133728027344, 0.382568359375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 16.0, 24.0, 39.0, 105.0, 197.0, 268.0, 182.0, 76.0, 40.0, 19.0, 11.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7217984199523926, -3.6108174324035645, -3.4998362064361572, -3.388855218887329, -3.277873992919922, -3.1668930053710938, -3.0559120178222656, -2.9449307918548584, -2.833949565887451, -2.722968578338623, -2.611987352371216, -2.5010063648223877, -2.3900251388549805, -2.2790441513061523, -2.168063163757324, -2.057081937789917, -1.9461009502410889, -1.8351198434829712, -1.7241387367248535, -1.6131577491760254, -1.5021765232086182, -1.39119553565979, -1.2802144289016724, -1.1692333221435547, -1.058252215385437, -0.9472711086273193, -0.8362900018692017, -0.7253089547157288, -0.6143278479576111, -0.5033467411994934, -0.3923656940460205, -0.28138458728790283, -0.17040348052978516, -0.059422388672828674, 0.05155870318412781, 0.1625397801399231, 0.27352088689804077, 0.38450199365615845, 0.49548304080963135, 0.606464147567749, 0.7174452543258667, 0.8284263610839844, 0.939407467842102, 1.0503885746002197, 1.1613695621490479, 1.272350788116455, 1.3833317756652832, 1.4943128824234009, 1.6052939891815186, 1.7162750959396362, 1.827256202697754, 1.938237190246582, 2.0492184162139893, 2.1601994037628174, 2.2711806297302246, 2.3821616172790527, 2.493142604827881, 2.604123592376709, 2.715104818344116, 2.8260858058929443, 2.9370670318603516, 3.0480480194091797, 3.159029006958008, 3.270010232925415, 3.3809914588928223]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 6.0, 13.0, 15.0, 17.0, 42.0, 36.0, 52.0, 67.0, 79.0, 93.0, 92.0, 67.0, 69.0, 63.0, 63.0, 60.0, 47.0, 34.0, 19.0, 19.0, 14.0, 10.0, 10.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.483320951461792, -1.447756290435791, -1.41219162940979, -1.3766270875930786, -1.3410624265670776, -1.3054977655410767, -1.2699332237243652, -1.2343685626983643, -1.1988039016723633, -1.1632392406463623, -1.1276745796203613, -1.09211003780365, -1.056545376777649, -1.020980715751648, -0.9854161143302917, -0.9498515129089355, -0.9142868518829346, -0.8787221908569336, -0.8431575894355774, -0.8075929880142212, -0.7720283269882202, -0.7364636659622192, -0.700899064540863, -0.6653344631195068, -0.6297698020935059, -0.5942051410675049, -0.5586405396461487, -0.5230759382247925, -0.4875112771987915, -0.4519466459751129, -0.4163820147514343, -0.38081738352775574, -0.34525275230407715, -0.30968812108039856, -0.27412348985671997, -0.23855885863304138, -0.2029942274093628, -0.1674295961856842, -0.13186496496200562, -0.09630033373832703, -0.06073570251464844, -0.02517107129096985, 0.01039355993270874, 0.04595819115638733, 0.08152282238006592, 0.1170874536037445, 0.1526520848274231, 0.18821671605110168, 0.22378134727478027, 0.25934597849845886, 0.29491060972213745, 0.33047524094581604, 0.36603987216949463, 0.4016045033931732, 0.4371691346168518, 0.4727337658405304, 0.508298397064209, 0.54386305809021, 0.5794276595115662, 0.6149922609329224, 0.6505569219589233, 0.6861215829849243, 0.7216861844062805, 0.7572507858276367, 0.7928154468536377]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 11.0, 8.0, 12.0, 19.0, 26.0, 17.0, 48.0, 53.0, 69.0, 102.0, 159.0, 282.0, 645.0, 1408.0, 4808.0, 25801.0, 259866.0, 649973.0, 89064.0, 11415.0, 2633.0, 978.0, 438.0, 238.0, 145.0, 92.0, 57.0, 51.0, 28.0, 25.0, 20.0, 9.0, 7.0, 10.0, 9.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.6005859375, -1.552490234375, -1.50439453125, -1.456298828125, -1.408203125, -1.360107421875, -1.31201171875, -1.263916015625, -1.2158203125, -1.167724609375, -1.11962890625, -1.071533203125, -1.0234375, -0.975341796875, -0.92724609375, -0.879150390625, -0.8310546875, -0.782958984375, -0.73486328125, -0.686767578125, -0.638671875, -0.590576171875, -0.54248046875, -0.494384765625, -0.4462890625, -0.398193359375, -0.35009765625, -0.302001953125, -0.25390625, -0.205810546875, -0.15771484375, -0.109619140625, -0.0615234375, -0.013427734375, 0.03466796875, 0.082763671875, 0.130859375, 0.178955078125, 0.22705078125, 0.275146484375, 0.3232421875, 0.371337890625, 0.41943359375, 0.467529296875, 0.515625, 0.563720703125, 0.61181640625, 0.659912109375, 0.7080078125, 0.756103515625, 0.80419921875, 0.852294921875, 0.900390625, 0.948486328125, 0.99658203125, 1.044677734375, 1.0927734375, 1.140869140625, 1.18896484375, 1.237060546875, 1.28515625, 1.333251953125, 1.38134765625, 1.429443359375, 1.4775390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 9.0, 4.0, 13.0, 20.0, 23.0, 49.0, 35.0, 50.0, 68.0, 67.0, 87.0, 87.0, 80.0, 77.0, 72.0, 81.0, 56.0, 32.0, 27.0, 22.0, 17.0, 13.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0828857421875, -0.07953834533691406, -0.07619094848632812, -0.07284355163574219, -0.06949615478515625, -0.06614875793457031, -0.06280136108398438, -0.05945396423339844, -0.0561065673828125, -0.05275917053222656, -0.049411773681640625, -0.04606437683105469, -0.04271697998046875, -0.03936958312988281, -0.036022186279296875, -0.03267478942871094, -0.029327392578125, -0.025979995727539062, -0.022632598876953125, -0.019285202026367188, -0.01593780517578125, -0.012590408325195312, -0.009243011474609375, -0.0058956146240234375, -0.0025482177734375, 0.0007991790771484375, 0.004146575927734375, 0.0074939727783203125, 0.01084136962890625, 0.014188766479492188, 0.017536163330078125, 0.020883560180664062, 0.02423095703125, 0.027578353881835938, 0.030925750732421875, 0.03427314758300781, 0.03762054443359375, 0.04096794128417969, 0.044315338134765625, 0.04766273498535156, 0.0510101318359375, 0.05435752868652344, 0.057704925537109375, 0.06105232238769531, 0.06439971923828125, 0.06774711608886719, 0.07109451293945312, 0.07444190979003906, 0.077789306640625, 0.08113670349121094, 0.08448410034179688, 0.08783149719238281, 0.09117889404296875, 0.09452629089355469, 0.09787368774414062, 0.10122108459472656, 0.1045684814453125, 0.10791587829589844, 0.11126327514648438, 0.11461067199707031, 0.11795806884765625, 0.12130546569824219, 0.12465286254882812, 0.12800025939941406, 0.13134765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 9.0, 10.0, 14.0, 27.0, 26.0, 51.0, 79.0, 119.0, 193.0, 395.0, 672.0, 1467.0, 3077.0, 7522.0, 23439.0, 92933.0, 351050.0, 402935.0, 119214.0, 29475.0, 8960.0, 3500.0, 1543.0, 781.0, 410.0, 229.0, 141.0, 81.0, 57.0, 37.0, 26.0, 23.0, 9.0, 13.0, 8.0, 4.0, 3.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.82177734375, -0.7990036010742188, -0.7762298583984375, -0.7534561157226562, -0.730682373046875, -0.7079086303710938, -0.6851348876953125, -0.6623611450195312, -0.63958740234375, -0.6168136596679688, -0.5940399169921875, -0.5712661743164062, -0.548492431640625, -0.5257186889648438, -0.5029449462890625, -0.48017120361328125, -0.4573974609375, -0.43462371826171875, -0.4118499755859375, -0.38907623291015625, -0.366302490234375, -0.34352874755859375, -0.3207550048828125, -0.29798126220703125, -0.27520751953125, -0.25243377685546875, -0.2296600341796875, -0.20688629150390625, -0.184112548828125, -0.16133880615234375, -0.1385650634765625, -0.11579132080078125, -0.093017578125, -0.07024383544921875, -0.0474700927734375, -0.02469635009765625, -0.001922607421875, 0.02085113525390625, 0.0436248779296875, 0.06639862060546875, 0.08917236328125, 0.11194610595703125, 0.1347198486328125, 0.15749359130859375, 0.180267333984375, 0.20304107666015625, 0.2258148193359375, 0.24858856201171875, 0.2713623046875, 0.29413604736328125, 0.3169097900390625, 0.33968353271484375, 0.362457275390625, 0.38523101806640625, 0.4080047607421875, 0.43077850341796875, 0.45355224609375, 0.47632598876953125, 0.4990997314453125, 0.5218734741210938, 0.544647216796875, 0.5674209594726562, 0.5901947021484375, 0.6129684448242188, 0.6357421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 4.0, 6.0, 9.0, 7.0, 10.0, 14.0, 15.0, 18.0, 22.0, 32.0, 33.0, 38.0, 30.0, 34.0, 30.0, 47.0, 43.0, 49.0, 46.0, 49.0, 49.0, 51.0, 31.0, 31.0, 40.0, 35.0, 33.0, 17.0, 28.0, 24.0, 14.0, 19.0, 15.0, 12.0, 11.0, 9.0, 11.0, 8.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.307373046875, -0.2979774475097656, -0.28858184814453125, -0.2791862487792969, -0.2697906494140625, -0.2603950500488281, -0.25099945068359375, -0.24160385131835938, -0.232208251953125, -0.22281265258789062, -0.21341705322265625, -0.20402145385742188, -0.1946258544921875, -0.18523025512695312, -0.17583465576171875, -0.16643905639648438, -0.15704345703125, -0.14764785766601562, -0.13825225830078125, -0.12885665893554688, -0.1194610595703125, -0.11006546020507812, -0.10066986083984375, -0.09127426147460938, -0.081878662109375, -0.07248306274414062, -0.06308746337890625, -0.053691864013671875, -0.0442962646484375, -0.034900665283203125, -0.02550506591796875, -0.016109466552734375, -0.0067138671875, 0.002681732177734375, 0.01207733154296875, 0.021472930908203125, 0.0308685302734375, 0.040264129638671875, 0.04965972900390625, 0.059055328369140625, 0.068450927734375, 0.07784652709960938, 0.08724212646484375, 0.09663772583007812, 0.1060333251953125, 0.11542892456054688, 0.12482452392578125, 0.13422012329101562, 0.14361572265625, 0.15301132202148438, 0.16240692138671875, 0.17180252075195312, 0.1811981201171875, 0.19059371948242188, 0.19998931884765625, 0.20938491821289062, 0.218780517578125, 0.22817611694335938, 0.23757171630859375, 0.24696731567382812, 0.2563629150390625, 0.2657585144042969, 0.27515411376953125, 0.2845497131347656, 0.2939453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 6.0, 8.0, 4.0, 4.0, 11.0, 14.0, 19.0, 24.0, 57.0, 77.0, 146.0, 279.0, 529.0, 1204.0, 3415.0, 12084.0, 88429.0, 700792.0, 212376.0, 20892.0, 4971.0, 1704.0, 709.0, 326.0, 164.0, 120.0, 53.0, 40.0, 22.0, 17.0, 15.0, 7.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6748046875, -0.6558837890625, -0.636962890625, -0.6180419921875, -0.59912109375, -0.5802001953125, -0.561279296875, -0.5423583984375, -0.5234375, -0.5045166015625, -0.485595703125, -0.4666748046875, -0.44775390625, -0.4288330078125, -0.409912109375, -0.3909912109375, -0.3720703125, -0.3531494140625, -0.334228515625, -0.3153076171875, -0.29638671875, -0.2774658203125, -0.258544921875, -0.2396240234375, -0.220703125, -0.2017822265625, -0.182861328125, -0.1639404296875, -0.14501953125, -0.1260986328125, -0.107177734375, -0.0882568359375, -0.0693359375, -0.0504150390625, -0.031494140625, -0.0125732421875, 0.00634765625, 0.0252685546875, 0.044189453125, 0.0631103515625, 0.08203125, 0.1009521484375, 0.119873046875, 0.1387939453125, 0.15771484375, 0.1766357421875, 0.195556640625, 0.2144775390625, 0.2333984375, 0.2523193359375, 0.271240234375, 0.2901611328125, 0.30908203125, 0.3280029296875, 0.346923828125, 0.3658447265625, 0.384765625, 0.4036865234375, 0.422607421875, 0.4415283203125, 0.46044921875, 0.4793701171875, 0.498291015625, 0.5172119140625, 0.5361328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 11.0, 9.0, 17.0, 16.0, 19.0, 29.0, 31.0, 42.0, 49.0, 64.0, 75.0, 83.0, 104.0, 67.0, 78.0, 54.0, 61.0, 41.0, 36.0, 25.0, 26.0, 11.0, 9.0, 7.0, 11.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.210803985595703e-05, -6.0187652707099915e-05, -5.82672655582428e-05, -5.634687840938568e-05, -5.4426491260528564e-05, -5.250610411167145e-05, -5.058571696281433e-05, -4.8665329813957214e-05, -4.67449426651001e-05, -4.482455551624298e-05, -4.2904168367385864e-05, -4.098378121852875e-05, -3.906339406967163e-05, -3.7143006920814514e-05, -3.52226197719574e-05, -3.330223262310028e-05, -3.1381845474243164e-05, -2.9461458325386047e-05, -2.754107117652893e-05, -2.5620684027671814e-05, -2.3700296878814697e-05, -2.177990972995758e-05, -1.9859522581100464e-05, -1.7939135432243347e-05, -1.601874828338623e-05, -1.4098361134529114e-05, -1.2177973985671997e-05, -1.025758683681488e-05, -8.337199687957764e-06, -6.416812539100647e-06, -4.49642539024353e-06, -2.5760382413864136e-06, -6.556510925292969e-07, 1.2647360563278198e-06, 3.1851232051849365e-06, 5.105510354042053e-06, 7.02589750289917e-06, 8.946284651756287e-06, 1.0866671800613403e-05, 1.278705894947052e-05, 1.4707446098327637e-05, 1.6627833247184753e-05, 1.854822039604187e-05, 2.0468607544898987e-05, 2.2388994693756104e-05, 2.430938184261322e-05, 2.6229768991470337e-05, 2.8150156140327454e-05, 3.007054328918457e-05, 3.199093043804169e-05, 3.3911317586898804e-05, 3.583170473575592e-05, 3.775209188461304e-05, 3.9672479033470154e-05, 4.159286618232727e-05, 4.351325333118439e-05, 4.5433640480041504e-05, 4.735402762889862e-05, 4.927441477775574e-05, 5.1194801926612854e-05, 5.311518907546997e-05, 5.503557622432709e-05, 5.6955963373184204e-05, 5.887635052204132e-05, 6.079673767089844e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 4.0, 5.0, 11.0, 13.0, 17.0, 12.0, 27.0, 54.0, 82.0, 154.0, 274.0, 586.0, 1381.0, 3486.0, 11839.0, 60879.0, 570322.0, 350703.0, 35644.0, 8227.0, 2725.0, 1065.0, 489.0, 239.0, 107.0, 79.0, 40.0, 30.0, 16.0, 11.0, 9.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.7109375, -0.6939544677734375, -0.676971435546875, -0.6599884033203125, -0.64300537109375, -0.6260223388671875, -0.609039306640625, -0.5920562744140625, -0.5750732421875, -0.5580902099609375, -0.541107177734375, -0.5241241455078125, -0.50714111328125, -0.4901580810546875, -0.473175048828125, -0.4561920166015625, -0.439208984375, -0.4222259521484375, -0.405242919921875, -0.3882598876953125, -0.37127685546875, -0.3542938232421875, -0.337310791015625, -0.3203277587890625, -0.3033447265625, -0.2863616943359375, -0.269378662109375, -0.2523956298828125, -0.23541259765625, -0.2184295654296875, -0.201446533203125, -0.1844635009765625, -0.16748046875, -0.1504974365234375, -0.133514404296875, -0.1165313720703125, -0.09954833984375, -0.0825653076171875, -0.065582275390625, -0.0485992431640625, -0.0316162109375, -0.0146331787109375, 0.002349853515625, 0.0193328857421875, 0.03631591796875, 0.0532989501953125, 0.070281982421875, 0.0872650146484375, 0.104248046875, 0.1212310791015625, 0.138214111328125, 0.1551971435546875, 0.17218017578125, 0.1891632080078125, 0.206146240234375, 0.2231292724609375, 0.2401123046875, 0.2570953369140625, 0.274078369140625, 0.2910614013671875, 0.30804443359375, 0.3250274658203125, 0.342010498046875, 0.3589935302734375, 0.3759765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 8.0, 16.0, 22.0, 19.0, 71.0, 69.0, 84.0, 116.0, 136.0, 119.0, 119.0, 63.0, 47.0, 34.0, 35.0, 8.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47802734375, -0.4656867980957031, -0.45334625244140625, -0.4410057067871094, -0.4286651611328125, -0.4163246154785156, -0.40398406982421875, -0.3916435241699219, -0.379302978515625, -0.3669624328613281, -0.35462188720703125, -0.3422813415527344, -0.3299407958984375, -0.3176002502441406, -0.30525970458984375, -0.2929191589355469, -0.28057861328125, -0.2682380676269531, -0.25589752197265625, -0.24355697631835938, -0.2312164306640625, -0.21887588500976562, -0.20653533935546875, -0.19419479370117188, -0.181854248046875, -0.16951370239257812, -0.15717315673828125, -0.14483261108398438, -0.1324920654296875, -0.12015151977539062, -0.10781097412109375, -0.09547042846679688, -0.0831298828125, -0.07078933715820312, -0.05844879150390625, -0.046108245849609375, -0.0337677001953125, -0.021427154541015625, -0.00908660888671875, 0.003253936767578125, 0.015594482421875, 0.027935028076171875, 0.04027557373046875, 0.052616119384765625, 0.0649566650390625, 0.07729721069335938, 0.08963775634765625, 0.10197830200195312, 0.11431884765625, 0.12665939331054688, 0.13899993896484375, 0.15134048461914062, 0.1636810302734375, 0.17602157592773438, 0.18836212158203125, 0.20070266723632812, 0.213043212890625, 0.22538375854492188, 0.23772430419921875, 0.2500648498535156, 0.2624053955078125, 0.2747459411621094, 0.28708648681640625, 0.2994270324707031, 0.311767578125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 14.0, 33.0, 80.0, 148.0, 250.0, 246.0, 126.0, 56.0, 28.0, 11.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.672994136810303, -6.440582275390625, -6.2081708908081055, -5.975759029388428, -5.74334716796875, -5.5109357833862305, -5.278523921966553, -5.046112060546875, -4.8137006759643555, -4.581288814544678, -4.348877429962158, -4.1164655685424805, -3.8840537071228027, -3.651642084121704, -3.4192304611206055, -3.1868185997009277, -2.95440673828125, -2.7219951152801514, -2.4895832538604736, -2.257171630859375, -2.0247597694396973, -1.7923481464385986, -1.5599365234375, -1.3275247812271118, -1.0951130390167236, -0.8627012968063354, -0.630289614200592, -0.39787793159484863, -0.16546618938446045, 0.06694555282592773, 0.29935717582702637, 0.5317689180374146, 0.7641811370849609, 0.9965928792953491, 1.2290046215057373, 1.461416244506836, 1.6938279867172241, 1.9262397289276123, 2.158651351928711, 2.3910632133483887, 2.6234748363494873, 2.855886459350586, 3.0882983207702637, 3.3207099437713623, 3.553121566772461, 3.7855334281921387, 4.017945289611816, 4.250356674194336, 4.482768535614014, 4.715180397033691, 4.947591781616211, 5.180003643035889, 5.412415504455566, 5.644826889038086, 5.877238750457764, 6.109650611877441, 6.342061996459961, 6.574473857879639, 6.806885242462158, 7.039297103881836, 7.271708965301514, 7.504120826721191, 7.736532211303711, 7.968944072723389, 8.201355934143066]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 3.0, 2.0, 6.0, 5.0, 8.0, 12.0, 12.0, 15.0, 15.0, 19.0, 28.0, 31.0, 30.0, 33.0, 46.0, 32.0, 48.0, 48.0, 39.0, 37.0, 42.0, 33.0, 37.0, 41.0, 37.0, 38.0, 32.0, 43.0, 30.0, 29.0, 25.0, 20.0, 18.0, 17.0, 19.0, 11.0, 9.0, 16.0, 5.0, 8.0, 5.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.741559386253357, -1.685322642326355, -1.629085898399353, -1.572849154472351, -1.5166124105453491, -1.4603756666183472, -1.4041389226913452, -1.3479021787643433, -1.2916654348373413, -1.2354286909103394, -1.1791919469833374, -1.1229552030563354, -1.0667184591293335, -1.0104817152023315, -0.9542449712753296, -0.8980082273483276, -0.8417714834213257, -0.7855347394943237, -0.7292979955673218, -0.6730612516403198, -0.6168245077133179, -0.5605877637863159, -0.504351019859314, -0.448114275932312, -0.39187753200531006, -0.3356407880783081, -0.27940404415130615, -0.2231673002243042, -0.16693055629730225, -0.11069381237030029, -0.05445706844329834, 0.0017796754837036133, 0.058016300201416016, 0.11425304412841797, 0.17048978805541992, 0.22672653198242188, 0.28296327590942383, 0.3392000198364258, 0.39543676376342773, 0.4516735076904297, 0.5079102516174316, 0.5641469955444336, 0.6203837394714355, 0.6766204833984375, 0.7328572273254395, 0.7890939712524414, 0.8453307151794434, 0.9015674591064453, 0.9578042030334473, 1.0140409469604492, 1.0702776908874512, 1.1265144348144531, 1.182751178741455, 1.238987922668457, 1.295224666595459, 1.351461410522461, 1.407698154449463, 1.4639348983764648, 1.5201716423034668, 1.5764083862304688, 1.6326451301574707, 1.6888818740844727, 1.7451186180114746, 1.8013553619384766, 1.8575921058654785]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 11.0, 11.0, 22.0, 24.0, 46.0, 78.0, 140.0, 266.0, 552.0, 1502.0, 5666.0, 42920.0, 3859616.0, 265021.0, 13832.0, 2841.0, 872.0, 372.0, 180.0, 97.0, 46.0, 40.0, 18.0, 25.0, 13.0, 13.0, 7.0, 3.0, 8.0, 6.0, 8.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5263671875, -1.4621124267578125, -1.397857666015625, -1.3336029052734375, -1.26934814453125, -1.2050933837890625, -1.140838623046875, -1.0765838623046875, -1.0123291015625, -0.9480743408203125, -0.883819580078125, -0.8195648193359375, -0.75531005859375, -0.6910552978515625, -0.626800537109375, -0.5625457763671875, -0.498291015625, -0.4340362548828125, -0.369781494140625, -0.3055267333984375, -0.24127197265625, -0.1770172119140625, -0.112762451171875, -0.0485076904296875, 0.0157470703125, 0.0800018310546875, 0.144256591796875, 0.2085113525390625, 0.27276611328125, 0.3370208740234375, 0.401275634765625, 0.4655303955078125, 0.52978515625, 0.5940399169921875, 0.658294677734375, 0.7225494384765625, 0.78680419921875, 0.8510589599609375, 0.915313720703125, 0.9795684814453125, 1.0438232421875, 1.1080780029296875, 1.172332763671875, 1.2365875244140625, 1.30084228515625, 1.3650970458984375, 1.429351806640625, 1.4936065673828125, 1.557861328125, 1.6221160888671875, 1.686370849609375, 1.7506256103515625, 1.81488037109375, 1.8791351318359375, 1.943389892578125, 2.0076446533203125, 2.0718994140625, 2.1361541748046875, 2.200408935546875, 2.2646636962890625, 2.32891845703125, 2.3931732177734375, 2.457427978515625, 2.5216827392578125, 2.5859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 2.0, 5.0, 9.0, 14.0, 17.0, 25.0, 27.0, 23.0, 65.0, 64.0, 66.0, 63.0, 78.0, 87.0, 71.0, 78.0, 55.0, 59.0, 47.0, 43.0, 21.0, 20.0, 22.0, 9.0, 5.0, 5.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0782470703125, -0.07489967346191406, -0.07155227661132812, -0.06820487976074219, -0.06485748291015625, -0.06151008605957031, -0.058162689208984375, -0.05481529235839844, -0.0514678955078125, -0.04812049865722656, -0.044773101806640625, -0.04142570495605469, -0.03807830810546875, -0.03473091125488281, -0.031383514404296875, -0.028036117553710938, -0.024688720703125, -0.021341323852539062, -0.017993927001953125, -0.014646530151367188, -0.01129913330078125, -0.007951736450195312, -0.004604339599609375, -0.0012569427490234375, 0.0020904541015625, 0.0054378509521484375, 0.008785247802734375, 0.012132644653320312, 0.01548004150390625, 0.018827438354492188, 0.022174835205078125, 0.025522232055664062, 0.02886962890625, 0.03221702575683594, 0.035564422607421875, 0.03891181945800781, 0.04225921630859375, 0.04560661315917969, 0.048954010009765625, 0.05230140686035156, 0.0556488037109375, 0.05899620056152344, 0.062343597412109375, 0.06569099426269531, 0.06903839111328125, 0.07238578796386719, 0.07573318481445312, 0.07908058166503906, 0.082427978515625, 0.08577537536621094, 0.08912277221679688, 0.09247016906738281, 0.09581756591796875, 0.09916496276855469, 0.10251235961914062, 0.10585975646972656, 0.1092071533203125, 0.11255455017089844, 0.11590194702148438, 0.11924934387207031, 0.12259674072265625, 0.1259441375732422, 0.12929153442382812, 0.13263893127441406, 0.135986328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 8.0, 10.0, 17.0, 35.0, 41.0, 83.0, 182.0, 385.0, 1173.0, 6971.0, 1667375.0, 2507908.0, 7943.0, 1321.0, 485.0, 193.0, 84.0, 36.0, 22.0, 10.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.220703125, -3.123138427734375, -3.02557373046875, -2.928009033203125, -2.8304443359375, -2.732879638671875, -2.63531494140625, -2.537750244140625, -2.440185546875, -2.342620849609375, -2.24505615234375, -2.147491455078125, -2.0499267578125, -1.952362060546875, -1.85479736328125, -1.757232666015625, -1.65966796875, -1.562103271484375, -1.46453857421875, -1.366973876953125, -1.2694091796875, -1.171844482421875, -1.07427978515625, -0.976715087890625, -0.879150390625, -0.781585693359375, -0.68402099609375, -0.586456298828125, -0.4888916015625, -0.391326904296875, -0.29376220703125, -0.196197509765625, -0.0986328125, -0.001068115234375, 0.09649658203125, 0.194061279296875, 0.2916259765625, 0.389190673828125, 0.48675537109375, 0.584320068359375, 0.681884765625, 0.779449462890625, 0.87701416015625, 0.974578857421875, 1.0721435546875, 1.169708251953125, 1.26727294921875, 1.364837646484375, 1.46240234375, 1.559967041015625, 1.65753173828125, 1.755096435546875, 1.8526611328125, 1.950225830078125, 2.04779052734375, 2.145355224609375, 2.242919921875, 2.340484619140625, 2.43804931640625, 2.535614013671875, 2.6331787109375, 2.730743408203125, 2.82830810546875, 2.925872802734375, 3.0234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 10.0, 18.0, 28.0, 52.0, 146.0, 461.0, 2084.0, 894.0, 222.0, 87.0, 29.0, 23.0, 10.0, 7.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.452880859375, -0.4390411376953125, -0.425201416015625, -0.4113616943359375, -0.39752197265625, -0.3836822509765625, -0.369842529296875, -0.3560028076171875, -0.3421630859375, -0.3283233642578125, -0.314483642578125, -0.3006439208984375, -0.28680419921875, -0.2729644775390625, -0.259124755859375, -0.2452850341796875, -0.2314453125, -0.2176055908203125, -0.203765869140625, -0.1899261474609375, -0.17608642578125, -0.1622467041015625, -0.148406982421875, -0.1345672607421875, -0.1207275390625, -0.1068878173828125, -0.093048095703125, -0.0792083740234375, -0.06536865234375, -0.0515289306640625, -0.037689208984375, -0.0238494873046875, -0.010009765625, 0.0038299560546875, 0.017669677734375, 0.0315093994140625, 0.04534912109375, 0.0591888427734375, 0.073028564453125, 0.0868682861328125, 0.1007080078125, 0.1145477294921875, 0.128387451171875, 0.1422271728515625, 0.15606689453125, 0.1699066162109375, 0.183746337890625, 0.1975860595703125, 0.21142578125, 0.2252655029296875, 0.239105224609375, 0.2529449462890625, 0.26678466796875, 0.2806243896484375, 0.294464111328125, 0.3083038330078125, 0.3221435546875, 0.3359832763671875, 0.349822998046875, 0.3636627197265625, 0.37750244140625, 0.3913421630859375, 0.405181884765625, 0.4190216064453125, 0.432861328125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 14.0, 40.0, 130.0, 396.0, 308.0, 83.0, 21.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.397743225097656, -4.250485897064209, -4.10322904586792, -3.9559717178344727, -3.8087146282196045, -3.6614575386047363, -3.514200210571289, -3.366943120956421, -3.2196860313415527, -3.0724289417266846, -2.9251718521118164, -2.777914524078369, -2.630657434463501, -2.483400344848633, -2.3361430168151855, -2.1888859272003174, -2.041628837585449, -1.894371747970581, -1.7471145391464233, -1.5998573303222656, -1.4526002407073975, -1.3053431510925293, -1.1580859422683716, -1.0108287334442139, -0.8635716438293457, -0.7163144946098328, -0.5690573453903198, -0.4218001961708069, -0.27454304695129395, -0.127285897731781, 0.019971251487731934, 0.16722846031188965, 0.3144855499267578, 0.46174269914627075, 0.6089998483657837, 0.7562569975852966, 0.9035141468048096, 1.0507712364196777, 1.1980284452438354, 1.3452856540679932, 1.4925427436828613, 1.6397998332977295, 1.7870570421218872, 1.934314250946045, 2.081571340560913, 2.2288284301757812, 2.3760857582092285, 2.5233428478240967, 2.670599937438965, 2.817857027053833, 2.965114116668701, 3.1123714447021484, 3.2596285343170166, 3.4068856239318848, 3.554142951965332, 3.7014000415802, 3.8486571311950684, 3.9959142208099365, 4.143171310424805, 4.290428638458252, 4.437685966491699, 4.584942817687988, 4.7322001457214355, 4.879457473754883, 5.026714324951172]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 10.0, 8.0, 7.0, 18.0, 10.0, 15.0, 23.0, 23.0, 36.0, 35.0, 59.0, 62.0, 48.0, 64.0, 59.0, 63.0, 75.0, 64.0, 60.0, 50.0, 49.0, 37.0, 27.0, 15.0, 20.0, 11.0, 17.0, 8.0, 4.0, 9.0, 4.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8421344757080078, -0.8111727237701416, -0.7802109718322754, -0.7492492198944092, -0.718287467956543, -0.6873257160186768, -0.6563639640808105, -0.6254022121429443, -0.5944404602050781, -0.5634787082672119, -0.5325169563293457, -0.5015552043914795, -0.4705934524536133, -0.43963170051574707, -0.40866991877555847, -0.37770816683769226, -0.34674638509750366, -0.31578463315963745, -0.28482288122177124, -0.25386112928390503, -0.22289936244487762, -0.1919376105070114, -0.160975843667984, -0.1300140917301178, -0.09905233979225159, -0.06809058785438538, -0.03712882846593857, -0.00616706907749176, 0.02479468286037445, 0.05575643479824066, 0.08671820163726807, 0.11767995357513428, 0.1486417055130005, 0.1796034574508667, 0.2105652093887329, 0.24152697622776031, 0.27248871326446533, 0.30345046520233154, 0.33441224694252014, 0.36537399888038635, 0.39633575081825256, 0.4272975027561188, 0.458259254693985, 0.4892210364341736, 0.5201827883720398, 0.551144540309906, 0.5821062922477722, 0.6130680441856384, 0.6440297961235046, 0.6749915480613708, 0.7059532999992371, 0.7369150519371033, 0.7678768038749695, 0.7988385558128357, 0.8298003673553467, 0.8607621192932129, 0.8917238712310791, 0.9226856231689453, 0.9536473751068115, 0.9846091270446777, 1.015570878982544, 1.0465326309204102, 1.0774943828582764, 1.1084561347961426, 1.1394178867340088]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 8.0, 3.0, 10.0, 18.0, 45.0, 73.0, 139.0, 322.0, 796.0, 2472.0, 20680.0, 764890.0, 249036.0, 7604.0, 1450.0, 529.0, 224.0, 104.0, 60.0, 29.0, 20.0, 9.0, 10.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.181640625, -2.09002685546875, -1.9984130859375, -1.90679931640625, -1.815185546875, -1.72357177734375, -1.6319580078125, -1.54034423828125, -1.44873046875, -1.35711669921875, -1.2655029296875, -1.17388916015625, -1.082275390625, -0.99066162109375, -0.8990478515625, -0.80743408203125, -0.7158203125, -0.62420654296875, -0.5325927734375, -0.44097900390625, -0.349365234375, -0.25775146484375, -0.1661376953125, -0.07452392578125, 0.01708984375, 0.10870361328125, 0.2003173828125, 0.29193115234375, 0.383544921875, 0.47515869140625, 0.5667724609375, 0.65838623046875, 0.75, 0.84161376953125, 0.9332275390625, 1.02484130859375, 1.116455078125, 1.20806884765625, 1.2996826171875, 1.39129638671875, 1.48291015625, 1.57452392578125, 1.6661376953125, 1.75775146484375, 1.849365234375, 1.94097900390625, 2.0325927734375, 2.12420654296875, 2.2158203125, 2.30743408203125, 2.3990478515625, 2.49066162109375, 2.582275390625, 2.67388916015625, 2.7655029296875, 2.85711669921875, 2.94873046875, 3.04034423828125, 3.1319580078125, 3.22357177734375, 3.315185546875, 3.40679931640625, 3.4984130859375, 3.59002685546875, 3.681640625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 9.0, 17.0, 25.0, 20.0, 30.0, 33.0, 49.0, 48.0, 63.0, 69.0, 75.0, 72.0, 71.0, 71.0, 65.0, 61.0, 48.0, 39.0, 23.0, 19.0, 27.0, 12.0, 12.0, 10.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.087890625, -0.08433341979980469, -0.08077621459960938, -0.07721900939941406, -0.07366180419921875, -0.07010459899902344, -0.06654739379882812, -0.06299018859863281, -0.0594329833984375, -0.05587577819824219, -0.052318572998046875, -0.04876136779785156, -0.04520416259765625, -0.04164695739746094, -0.038089752197265625, -0.03453254699707031, -0.030975341796875, -0.027418136596679688, -0.023860931396484375, -0.020303726196289062, -0.01674652099609375, -0.013189315795898438, -0.009632110595703125, -0.0060749053955078125, -0.0025177001953125, 0.0010395050048828125, 0.004596710205078125, 0.008153915405273438, 0.01171112060546875, 0.015268325805664062, 0.018825531005859375, 0.022382736206054688, 0.02593994140625, 0.029497146606445312, 0.033054351806640625, 0.03661155700683594, 0.04016876220703125, 0.04372596740722656, 0.047283172607421875, 0.05084037780761719, 0.0543975830078125, 0.05795478820800781, 0.061511993408203125, 0.06506919860839844, 0.06862640380859375, 0.07218360900878906, 0.07574081420898438, 0.07929801940917969, 0.082855224609375, 0.08641242980957031, 0.08996963500976562, 0.09352684020996094, 0.09708404541015625, 0.10064125061035156, 0.10419845581054688, 0.10775566101074219, 0.1113128662109375, 0.11487007141113281, 0.11842727661132812, 0.12198448181152344, 0.12554168701171875, 0.12909889221191406, 0.13265609741210938, 0.1362133026123047, 0.1397705078125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 7.0, 4.0, 12.0, 10.0, 7.0, 21.0, 24.0, 31.0, 41.0, 68.0, 92.0, 152.0, 254.0, 373.0, 759.0, 1238.0, 2514.0, 5655.0, 15695.0, 58450.0, 260037.0, 477039.0, 167663.0, 38127.0, 11312.0, 4277.0, 2055.0, 1083.0, 575.0, 366.0, 197.0, 130.0, 92.0, 45.0, 40.0, 29.0, 18.0, 12.0, 14.0, 3.0, 12.0, 8.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.88916015625, -0.8632736206054688, -0.8373870849609375, -0.8115005493164062, -0.785614013671875, -0.7597274780273438, -0.7338409423828125, -0.7079544067382812, -0.68206787109375, -0.6561813354492188, -0.6302947998046875, -0.6044082641601562, -0.578521728515625, -0.5526351928710938, -0.5267486572265625, -0.5008621215820312, -0.4749755859375, -0.44908905029296875, -0.4232025146484375, -0.39731597900390625, -0.371429443359375, -0.34554290771484375, -0.3196563720703125, -0.29376983642578125, -0.26788330078125, -0.24199676513671875, -0.2161102294921875, -0.19022369384765625, -0.164337158203125, -0.13845062255859375, -0.1125640869140625, -0.08667755126953125, -0.060791015625, -0.03490447998046875, -0.0090179443359375, 0.01686859130859375, 0.042755126953125, 0.06864166259765625, 0.0945281982421875, 0.12041473388671875, 0.14630126953125, 0.17218780517578125, 0.1980743408203125, 0.22396087646484375, 0.249847412109375, 0.27573394775390625, 0.3016204833984375, 0.32750701904296875, 0.3533935546875, 0.37928009033203125, 0.4051666259765625, 0.43105316162109375, 0.456939697265625, 0.48282623291015625, 0.5087127685546875, 0.5345993041992188, 0.56048583984375, 0.5863723754882812, 0.6122589111328125, 0.6381454467773438, 0.664031982421875, 0.6899185180664062, 0.7158050537109375, 0.7416915893554688, 0.767578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 6.0, 10.0, 11.0, 10.0, 11.0, 15.0, 17.0, 20.0, 22.0, 22.0, 21.0, 32.0, 35.0, 40.0, 36.0, 46.0, 43.0, 50.0, 47.0, 38.0, 47.0, 42.0, 46.0, 43.0, 34.0, 38.0, 21.0, 25.0, 28.0, 25.0, 18.0, 15.0, 14.0, 12.0, 12.0, 8.0, 10.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.423095703125, -0.41040802001953125, -0.3977203369140625, -0.38503265380859375, -0.372344970703125, -0.35965728759765625, -0.3469696044921875, -0.33428192138671875, -0.32159423828125, -0.30890655517578125, -0.2962188720703125, -0.28353118896484375, -0.270843505859375, -0.25815582275390625, -0.2454681396484375, -0.23278045654296875, -0.2200927734375, -0.20740509033203125, -0.1947174072265625, -0.18202972412109375, -0.169342041015625, -0.15665435791015625, -0.1439666748046875, -0.13127899169921875, -0.11859130859375, -0.10590362548828125, -0.0932159423828125, -0.08052825927734375, -0.067840576171875, -0.05515289306640625, -0.0424652099609375, -0.02977752685546875, -0.01708984375, -0.00440216064453125, 0.0082855224609375, 0.02097320556640625, 0.033660888671875, 0.04634857177734375, 0.0590362548828125, 0.07172393798828125, 0.08441162109375, 0.09709930419921875, 0.1097869873046875, 0.12247467041015625, 0.135162353515625, 0.14785003662109375, 0.1605377197265625, 0.17322540283203125, 0.1859130859375, 0.19860076904296875, 0.2112884521484375, 0.22397613525390625, 0.236663818359375, 0.24935150146484375, 0.2620391845703125, 0.27472686767578125, 0.28741455078125, 0.30010223388671875, 0.3127899169921875, 0.32547760009765625, 0.338165283203125, 0.35085296630859375, 0.3635406494140625, 0.37622833251953125, 0.388916015625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 3.0, 8.0, 10.0, 16.0, 24.0, 34.0, 40.0, 93.0, 115.0, 191.0, 264.0, 473.0, 939.0, 2061.0, 5175.0, 16556.0, 78215.0, 430139.0, 415378.0, 73703.0, 15822.0, 4982.0, 2061.0, 951.0, 503.0, 290.0, 167.0, 115.0, 66.0, 40.0, 37.0, 18.0, 19.0, 9.0, 6.0, 4.0, 5.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.445068359375, -0.4302253723144531, -0.41538238525390625, -0.4005393981933594, -0.3856964111328125, -0.3708534240722656, -0.35601043701171875, -0.3411674499511719, -0.326324462890625, -0.3114814758300781, -0.29663848876953125, -0.2817955017089844, -0.2669525146484375, -0.2521095275878906, -0.23726654052734375, -0.22242355346679688, -0.20758056640625, -0.19273757934570312, -0.17789459228515625, -0.16305160522460938, -0.1482086181640625, -0.13336563110351562, -0.11852264404296875, -0.10367965698242188, -0.088836669921875, -0.07399368286132812, -0.05915069580078125, -0.044307708740234375, -0.0294647216796875, -0.014621734619140625, 0.00022125244140625, 0.015064239501953125, 0.0299072265625, 0.044750213623046875, 0.05959320068359375, 0.07443618774414062, 0.0892791748046875, 0.10412216186523438, 0.11896514892578125, 0.13380813598632812, 0.148651123046875, 0.16349411010742188, 0.17833709716796875, 0.19318008422851562, 0.2080230712890625, 0.22286605834960938, 0.23770904541015625, 0.2525520324707031, 0.26739501953125, 0.2822380065917969, 0.29708099365234375, 0.3119239807128906, 0.3267669677734375, 0.3416099548339844, 0.35645294189453125, 0.3712959289550781, 0.386138916015625, 0.4009819030761719, 0.41582489013671875, 0.4306678771972656, 0.4455108642578125, 0.4603538513183594, 0.47519683837890625, 0.4900398254394531, 0.5048828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 5.0, 10.0, 19.0, 22.0, 37.0, 50.0, 88.0, 119.0, 152.0, 177.0, 119.0, 63.0, 53.0, 33.0, 18.0, 8.0, 11.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000179290771484375, -0.000174802727997303, -0.00017031468451023102, -0.00016582664102315903, -0.00016133859753608704, -0.00015685055404901505, -0.00015236251056194305, -0.00014787446707487106, -0.00014338642358779907, -0.00013889838010072708, -0.0001344103366136551, -0.0001299222931265831, -0.0001254342496395111, -0.00012094620615243912, -0.00011645816266536713, -0.00011197011917829514, -0.00010748207569122314, -0.00010299403220415115, -9.850598871707916e-05, -9.401794523000717e-05, -8.952990174293518e-05, -8.504185825586319e-05, -8.05538147687912e-05, -7.606577128171921e-05, -7.157772779464722e-05, -6.708968430757523e-05, -6.260164082050323e-05, -5.8113597333431244e-05, -5.362555384635925e-05, -4.913751035928726e-05, -4.464946687221527e-05, -4.016142338514328e-05, -3.567337989807129e-05, -3.11853364109993e-05, -2.6697292923927307e-05, -2.2209249436855316e-05, -1.7721205949783325e-05, -1.3233162462711334e-05, -8.745118975639343e-06, -4.257075488567352e-06, 2.3096799850463867e-07, 4.71901148557663e-06, 9.20705497264862e-06, 1.3695098459720612e-05, 1.8183141946792603e-05, 2.2671185433864594e-05, 2.7159228920936584e-05, 3.1647272408008575e-05, 3.6135315895080566e-05, 4.062335938215256e-05, 4.511140286922455e-05, 4.959944635629654e-05, 5.408748984336853e-05, 5.857553333044052e-05, 6.306357681751251e-05, 6.75516203045845e-05, 7.20396637916565e-05, 7.652770727872849e-05, 8.101575076580048e-05, 8.550379425287247e-05, 8.999183773994446e-05, 9.447988122701645e-05, 9.896792471408844e-05, 0.00010345596820116043, 0.00010794401168823242]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 9.0, 6.0, 15.0, 16.0, 33.0, 39.0, 61.0, 106.0, 164.0, 199.0, 398.0, 648.0, 1223.0, 2495.0, 6131.0, 18515.0, 86514.0, 472261.0, 372987.0, 62245.0, 14605.0, 5119.0, 2204.0, 1052.0, 578.0, 318.0, 215.0, 124.0, 74.0, 57.0, 34.0, 37.0, 18.0, 10.0, 10.0, 6.0, 6.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.477783203125, -0.46369171142578125, -0.4496002197265625, -0.43550872802734375, -0.421417236328125, -0.40732574462890625, -0.3932342529296875, -0.37914276123046875, -0.36505126953125, -0.35095977783203125, -0.3368682861328125, -0.32277679443359375, -0.308685302734375, -0.29459381103515625, -0.2805023193359375, -0.26641082763671875, -0.2523193359375, -0.23822784423828125, -0.2241363525390625, -0.21004486083984375, -0.195953369140625, -0.18186187744140625, -0.1677703857421875, -0.15367889404296875, -0.13958740234375, -0.12549591064453125, -0.1114044189453125, -0.09731292724609375, -0.083221435546875, -0.06912994384765625, -0.0550384521484375, -0.04094696044921875, -0.02685546875, -0.01276397705078125, 0.0013275146484375, 0.01541900634765625, 0.029510498046875, 0.04360198974609375, 0.0576934814453125, 0.07178497314453125, 0.08587646484375, 0.09996795654296875, 0.1140594482421875, 0.12815093994140625, 0.142242431640625, 0.15633392333984375, 0.1704254150390625, 0.18451690673828125, 0.1986083984375, 0.21269989013671875, 0.2267913818359375, 0.24088287353515625, 0.254974365234375, 0.26906585693359375, 0.2831573486328125, 0.29724884033203125, 0.31134033203125, 0.32543182373046875, 0.3395233154296875, 0.35361480712890625, 0.367706298828125, 0.38179779052734375, 0.3958892822265625, 0.40998077392578125, 0.424072265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 11.0, 15.0, 12.0, 18.0, 24.0, 32.0, 30.0, 50.0, 57.0, 60.0, 84.0, 77.0, 88.0, 85.0, 71.0, 65.0, 50.0, 27.0, 35.0, 24.0, 22.0, 13.0, 9.0, 6.0, 5.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.32080078125, -0.3119010925292969, -0.30300140380859375, -0.2941017150878906, -0.2852020263671875, -0.2763023376464844, -0.26740264892578125, -0.2585029602050781, -0.249603271484375, -0.24070358276367188, -0.23180389404296875, -0.22290420532226562, -0.2140045166015625, -0.20510482788085938, -0.19620513916015625, -0.18730545043945312, -0.17840576171875, -0.16950607299804688, -0.16060638427734375, -0.15170669555664062, -0.1428070068359375, -0.13390731811523438, -0.12500762939453125, -0.11610794067382812, -0.107208251953125, -0.09830856323242188, -0.08940887451171875, -0.08050918579101562, -0.0716094970703125, -0.06270980834960938, -0.05381011962890625, -0.044910430908203125, -0.0360107421875, -0.027111053466796875, -0.01821136474609375, -0.009311676025390625, -0.0004119873046875, 0.008487701416015625, 0.01738739013671875, 0.026287078857421875, 0.035186767578125, 0.044086456298828125, 0.05298614501953125, 0.061885833740234375, 0.0707855224609375, 0.07968521118164062, 0.08858489990234375, 0.09748458862304688, 0.10638427734375, 0.11528396606445312, 0.12418365478515625, 0.13308334350585938, 0.1419830322265625, 0.15088272094726562, 0.15978240966796875, 0.16868209838867188, 0.177581787109375, 0.18648147583007812, 0.19538116455078125, 0.20428085327148438, 0.2131805419921875, 0.22208023071289062, 0.23097991943359375, 0.23987960815429688, 0.248779296875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 13.0, 12.0, 18.0, 31.0, 47.0, 89.0, 118.0, 184.0, 169.0, 129.0, 84.0, 49.0, 24.0, 15.0, 8.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82899284362793, -4.634719371795654, -4.440446376800537, -4.246172904968262, -4.0518999099731445, -3.8576266765594482, -3.663353443145752, -3.4690799713134766, -3.2748069763183594, -3.080533742904663, -2.886260509490967, -2.6919872760772705, -2.497714042663574, -2.303440809249878, -2.1091675758361816, -1.9148942232131958, -1.72062087059021, -1.5263476371765137, -1.3320744037628174, -1.137801170349121, -0.94352787733078, -0.7492546439170837, -0.5549813508987427, -0.3607081174850464, -0.1664348840713501, 0.027838364243507385, 0.22211161255836487, 0.41638487577438354, 0.6106581091880798, 0.8049313426017761, 0.9992046356201172, 1.1934778690338135, 1.3877511024475098, 1.582024335861206, 1.7762975692749023, 1.9705708026885986, 2.164844036102295, 2.359117269515991, 2.5533905029296875, 2.747663974761963, 2.94193696975708, 3.1362102031707764, 3.3304834365844727, 3.524756669998169, 3.7190299034118652, 3.9133031368255615, 4.107576370239258, 4.301849842071533, 4.496123313903809, 4.690396785736084, 4.884669780731201, 5.078943252563477, 5.273216247558594, 5.467489719390869, 5.661762714385986, 5.856036186218262, 6.050309181213379, 6.244582653045654, 6.4388556480407715, 6.633129119873047, 6.827402114868164, 7.0216755867004395, 7.215948581695557, 7.410222053527832, 7.604495048522949]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 7.0, 17.0, 20.0, 25.0, 25.0, 25.0, 37.0, 55.0, 46.0, 67.0, 65.0, 75.0, 69.0, 66.0, 57.0, 72.0, 53.0, 46.0, 36.0, 39.0, 21.0, 11.0, 17.0, 11.0, 10.0, 3.0, 7.0, 3.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6068387031555176, -3.4877161979675293, -3.36859393119812, -3.249471426010132, -3.1303491592407227, -3.0112266540527344, -2.892104148864746, -2.772981882095337, -2.6538596153259277, -2.5347371101379395, -2.4156148433685303, -2.296492338180542, -2.177370071411133, -2.0582475662231445, -1.9391251802444458, -1.820002794265747, -1.7008802890777588, -1.58175790309906, -1.4626355171203613, -1.343513011932373, -1.2243907451629639, -1.1052682399749756, -0.9861458539962769, -0.8670234680175781, -0.7479010820388794, -0.6287786960601807, -0.5096563100814819, -0.3905338644981384, -0.2714114785194397, -0.15228909254074097, -0.03316664695739746, 0.08595573902130127, 0.205078125, 0.32420051097869873, 0.44332292675971985, 0.562445342540741, 0.6815677285194397, 0.8006901144981384, 0.9198125600814819, 1.0389349460601807, 1.1580573320388794, 1.2771797180175781, 1.3963021039962769, 1.5154244899749756, 1.6345469951629639, 1.753669261932373, 1.8727917671203613, 1.99191415309906, 2.111036539077759, 2.230159044265747, 2.3492813110351562, 2.4684038162231445, 2.5875260829925537, 2.706648588180542, 2.825770854949951, 2.9448933601379395, 3.0640158653259277, 3.183138370513916, 3.302260637283325, 3.4213831424713135, 3.5405054092407227, 3.659627914428711, 3.778750419616699, 3.8978726863861084, 4.016994953155518]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 5.0, 15.0, 20.0, 38.0, 50.0, 106.0, 201.0, 393.0, 888.0, 2274.0, 7070.0, 32631.0, 417693.0, 3606772.0, 104860.0, 14798.0, 3773.0, 1307.0, 573.0, 255.0, 154.0, 84.0, 79.0, 60.0, 42.0, 30.0, 24.0, 10.0, 13.0, 7.0, 12.0, 4.0, 10.0, 4.0, 5.0, 4.0, 7.0, 2.0, 2.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0009765625, -0.9516143798828125, -0.902252197265625, -0.8528900146484375, -0.80352783203125, -0.7541656494140625, -0.704803466796875, -0.6554412841796875, -0.6060791015625, -0.5567169189453125, -0.507354736328125, -0.4579925537109375, -0.40863037109375, -0.3592681884765625, -0.309906005859375, -0.2605438232421875, -0.211181640625, -0.1618194580078125, -0.112457275390625, -0.0630950927734375, -0.01373291015625, 0.0356292724609375, 0.084991455078125, 0.1343536376953125, 0.1837158203125, 0.2330780029296875, 0.282440185546875, 0.3318023681640625, 0.38116455078125, 0.4305267333984375, 0.479888916015625, 0.5292510986328125, 0.57861328125, 0.6279754638671875, 0.677337646484375, 0.7266998291015625, 0.77606201171875, 0.8254241943359375, 0.874786376953125, 0.9241485595703125, 0.9735107421875, 1.0228729248046875, 1.072235107421875, 1.1215972900390625, 1.17095947265625, 1.2203216552734375, 1.269683837890625, 1.3190460205078125, 1.368408203125, 1.4177703857421875, 1.467132568359375, 1.5164947509765625, 1.56585693359375, 1.6152191162109375, 1.664581298828125, 1.7139434814453125, 1.7633056640625, 1.8126678466796875, 1.862030029296875, 1.9113922119140625, 1.96075439453125, 2.0101165771484375, 2.059478759765625, 2.1088409423828125, 2.158203125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 1.0, 2.0, 8.0, 1.0, 14.0, 6.0, 17.0, 21.0, 33.0, 30.0, 33.0, 45.0, 50.0, 68.0, 60.0, 80.0, 75.0, 65.0, 81.0, 63.0, 64.0, 37.0, 30.0, 31.0, 34.0, 12.0, 10.0, 11.0, 6.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10406494140625, -0.10026073455810547, -0.09645652770996094, -0.0926523208618164, -0.08884811401367188, -0.08504390716552734, -0.08123970031738281, -0.07743549346923828, -0.07363128662109375, -0.06982707977294922, -0.06602287292480469, -0.062218666076660156, -0.058414459228515625, -0.054610252380371094, -0.05080604553222656, -0.04700183868408203, -0.0431976318359375, -0.03939342498779297, -0.03558921813964844, -0.031785011291503906, -0.027980804443359375, -0.024176597595214844, -0.020372390747070312, -0.01656818389892578, -0.01276397705078125, -0.008959770202636719, -0.0051555633544921875, -0.0013513565063476562, 0.002452850341796875, 0.006257057189941406, 0.010061264038085938, 0.013865470886230469, 0.017669677734375, 0.02147388458251953, 0.025278091430664062, 0.029082298278808594, 0.032886505126953125, 0.036690711975097656, 0.04049491882324219, 0.04429912567138672, 0.04810333251953125, 0.05190753936767578, 0.05571174621582031, 0.059515953063964844, 0.06332015991210938, 0.0671243667602539, 0.07092857360839844, 0.07473278045654297, 0.0785369873046875, 0.08234119415283203, 0.08614540100097656, 0.0899496078491211, 0.09375381469726562, 0.09755802154541016, 0.10136222839355469, 0.10516643524169922, 0.10897064208984375, 0.11277484893798828, 0.11657905578613281, 0.12038326263427734, 0.12418746948242188, 0.1279916763305664, 0.13179588317871094, 0.13560009002685547, 0.139404296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 13.0, 12.0, 14.0, 25.0, 61.0, 98.0, 166.0, 452.0, 1361.0, 9178.0, 4036700.0, 140420.0, 4102.0, 987.0, 328.0, 150.0, 80.0, 46.0, 33.0, 18.0, 11.0, 11.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.97265625, -6.801788330078125, -6.63092041015625, -6.460052490234375, -6.2891845703125, -6.118316650390625, -5.94744873046875, -5.776580810546875, -5.605712890625, -5.434844970703125, -5.26397705078125, -5.093109130859375, -4.9222412109375, -4.751373291015625, -4.58050537109375, -4.409637451171875, -4.23876953125, -4.067901611328125, -3.89703369140625, -3.726165771484375, -3.5552978515625, -3.384429931640625, -3.21356201171875, -3.042694091796875, -2.871826171875, -2.700958251953125, -2.53009033203125, -2.359222412109375, -2.1883544921875, -2.017486572265625, -1.84661865234375, -1.675750732421875, -1.5048828125, -1.334014892578125, -1.16314697265625, -0.992279052734375, -0.8214111328125, -0.650543212890625, -0.47967529296875, -0.308807373046875, -0.137939453125, 0.032928466796875, 0.20379638671875, 0.374664306640625, 0.5455322265625, 0.716400146484375, 0.88726806640625, 1.058135986328125, 1.22900390625, 1.399871826171875, 1.57073974609375, 1.741607666015625, 1.9124755859375, 2.083343505859375, 2.25421142578125, 2.425079345703125, 2.595947265625, 2.766815185546875, 2.93768310546875, 3.108551025390625, 3.2794189453125, 3.450286865234375, 3.62115478515625, 3.792022705078125, 3.962890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 20.0, 23.0, 35.0, 79.0, 155.0, 376.0, 1652.0, 1174.0, 300.0, 120.0, 66.0, 23.0, 18.0, 11.0, 6.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.351318359375, -0.3304786682128906, -0.30963897705078125, -0.2887992858886719, -0.2679595947265625, -0.24711990356445312, -0.22628021240234375, -0.20544052124023438, -0.184600830078125, -0.16376113891601562, -0.14292144775390625, -0.12208175659179688, -0.1012420654296875, -0.08040237426757812, -0.05956268310546875, -0.038722991943359375, -0.01788330078125, 0.002956390380859375, 0.02379608154296875, 0.044635772705078125, 0.0654754638671875, 0.08631515502929688, 0.10715484619140625, 0.12799453735351562, 0.148834228515625, 0.16967391967773438, 0.19051361083984375, 0.21135330200195312, 0.2321929931640625, 0.2530326843261719, 0.27387237548828125, 0.2947120666503906, 0.3155517578125, 0.3363914489746094, 0.35723114013671875, 0.3780708312988281, 0.3989105224609375, 0.4197502136230469, 0.44058990478515625, 0.4614295959472656, 0.482269287109375, 0.5031089782714844, 0.5239486694335938, 0.5447883605957031, 0.5656280517578125, 0.5864677429199219, 0.6073074340820312, 0.6281471252441406, 0.64898681640625, 0.6698265075683594, 0.6906661987304688, 0.7115058898925781, 0.7323455810546875, 0.7531852722167969, 0.7740249633789062, 0.7948646545410156, 0.815704345703125, 0.8365440368652344, 0.8573837280273438, 0.8782234191894531, 0.8990631103515625, 0.9199028015136719, 0.9407424926757812, 0.9615821838378906, 0.982421875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 7.0, 22.0, 75.0, 255.0, 396.0, 175.0, 45.0, 20.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.42778491973877, -8.139674186706543, -7.851562976837158, -7.563452243804932, -7.275341033935547, -6.98723030090332, -6.699119567871094, -6.411008834838867, -6.122897624969482, -5.834786891937256, -5.546675682067871, -5.2585649490356445, -4.970454216003418, -4.682343006134033, -4.394232273101807, -4.106121063232422, -3.8180103302001953, -3.5298993587493896, -3.241788387298584, -2.9536776542663574, -2.6655666828155518, -2.377455711364746, -2.0893449783325195, -1.8012340068817139, -1.5131230354309082, -1.2250120639801025, -0.9369012117385864, -0.6487902998924255, -0.36067938804626465, -0.07256841659545898, 0.21554243564605713, 0.5036532878875732, 0.7917652130126953, 1.079876184463501, 1.367987036705017, 1.6560978889465332, 1.9442088603973389, 2.2323198318481445, 2.520430564880371, 2.8085415363311768, 3.0966525077819824, 3.384763479232788, 3.6728744506835938, 3.9609851837158203, 4.249095916748047, 4.537207126617432, 4.825317859649658, 5.113429069519043, 5.4015398025512695, 5.689650535583496, 5.977761745452881, 6.265872478485107, 6.553983688354492, 6.842094421386719, 7.130205154418945, 7.418315887451172, 7.706427097320557, 7.994537830352783, 8.282649040222168, 8.570759773254395, 8.858870506286621, 9.146982192993164, 9.43509292602539, 9.723203659057617, 10.011314392089844]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 8.0, 9.0, 13.0, 19.0, 28.0, 32.0, 54.0, 55.0, 81.0, 72.0, 60.0, 86.0, 88.0, 71.0, 73.0, 56.0, 53.0, 33.0, 26.0, 28.0, 19.0, 12.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9469283819198608, -1.8755866289138794, -1.8042447566986084, -1.732903003692627, -1.661561131477356, -1.5902193784713745, -1.5188775062561035, -1.447535753250122, -1.3761940002441406, -1.3048522472381592, -1.2335103750228882, -1.1621686220169067, -1.0908267498016357, -1.0194849967956543, -0.9481431841850281, -0.8768013715744019, -0.8054594993591309, -0.7341176867485046, -0.6627758741378784, -0.591434121131897, -0.520092248916626, -0.44875046610832214, -0.3774086833000183, -0.3060668706893921, -0.23472505807876587, -0.16338324546813965, -0.09204144775867462, -0.020699650049209595, 0.050642162561416626, 0.12198397517204285, 0.19332575798034668, 0.2646675705909729, 0.33600926399230957, 0.4073510766029358, 0.478692889213562, 0.5500346422195435, 0.6213765144348145, 0.6927182674407959, 0.7640600800514221, 0.8354018926620483, 0.9067437052726746, 0.9780855178833008, 1.0494272708892822, 1.1207691431045532, 1.1921108961105347, 1.2634527683258057, 1.334794521331787, 1.4061362743377686, 1.4774781465530396, 1.548819899559021, 1.620161771774292, 1.6915035247802734, 1.7628453969955444, 1.8341871500015259, 1.9055290222167969, 1.9768707752227783, 2.0482125282287598, 2.119554281234741, 2.1908960342407227, 2.262238025665283, 2.3335797786712646, 2.404921531677246, 2.4762632846832275, 2.547605037689209, 2.6189470291137695]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 10.0, 13.0, 13.0, 25.0, 25.0, 41.0, 75.0, 94.0, 202.0, 323.0, 635.0, 1252.0, 3218.0, 12596.0, 105910.0, 661141.0, 231879.0, 22999.0, 4623.0, 1640.0, 792.0, 400.0, 217.0, 137.0, 82.0, 74.0, 33.0, 28.0, 24.0, 15.0, 8.0, 6.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.8779296875, -1.8267059326171875, -1.775482177734375, -1.7242584228515625, -1.67303466796875, -1.6218109130859375, -1.570587158203125, -1.5193634033203125, -1.4681396484375, -1.4169158935546875, -1.365692138671875, -1.3144683837890625, -1.26324462890625, -1.2120208740234375, -1.160797119140625, -1.1095733642578125, -1.058349609375, -1.0071258544921875, -0.955902099609375, -0.9046783447265625, -0.85345458984375, -0.8022308349609375, -0.751007080078125, -0.6997833251953125, -0.6485595703125, -0.5973358154296875, -0.546112060546875, -0.4948883056640625, -0.44366455078125, -0.3924407958984375, -0.341217041015625, -0.2899932861328125, -0.23876953125, -0.1875457763671875, -0.136322021484375, -0.0850982666015625, -0.03387451171875, 0.0173492431640625, 0.068572998046875, 0.1197967529296875, 0.1710205078125, 0.2222442626953125, 0.273468017578125, 0.3246917724609375, 0.37591552734375, 0.4271392822265625, 0.478363037109375, 0.5295867919921875, 0.580810546875, 0.6320343017578125, 0.683258056640625, 0.7344818115234375, 0.78570556640625, 0.8369293212890625, 0.888153076171875, 0.9393768310546875, 0.9906005859375, 1.0418243408203125, 1.093048095703125, 1.1442718505859375, 1.19549560546875, 1.2467193603515625, 1.297943115234375, 1.3491668701171875, 1.400390625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 12.0, 16.0, 22.0, 32.0, 53.0, 73.0, 96.0, 107.0, 125.0, 108.0, 123.0, 69.0, 62.0, 44.0, 19.0, 16.0, 9.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2049560546875, -0.1978168487548828, -0.19067764282226562, -0.18353843688964844, -0.17639923095703125, -0.16926002502441406, -0.16212081909179688, -0.1549816131591797, -0.1478424072265625, -0.1407032012939453, -0.13356399536132812, -0.12642478942871094, -0.11928558349609375, -0.11214637756347656, -0.10500717163085938, -0.09786796569824219, -0.090728759765625, -0.08358955383300781, -0.07645034790039062, -0.06931114196777344, -0.06217193603515625, -0.05503273010253906, -0.047893524169921875, -0.04075431823730469, -0.0336151123046875, -0.026475906372070312, -0.019336700439453125, -0.012197494506835938, -0.00505828857421875, 0.0020809173583984375, 0.009220123291015625, 0.016359329223632812, 0.02349853515625, 0.030637741088867188, 0.037776947021484375, 0.04491615295410156, 0.05205535888671875, 0.05919456481933594, 0.06633377075195312, 0.07347297668457031, 0.0806121826171875, 0.08775138854980469, 0.09489059448242188, 0.10202980041503906, 0.10916900634765625, 0.11630821228027344, 0.12344741821289062, 0.1305866241455078, 0.137725830078125, 0.1448650360107422, 0.15200424194335938, 0.15914344787597656, 0.16628265380859375, 0.17342185974121094, 0.18056106567382812, 0.1877002716064453, 0.1948394775390625, 0.2019786834716797, 0.20911788940429688, 0.21625709533691406, 0.22339630126953125, 0.23053550720214844, 0.23767471313476562, 0.2448139190673828, 0.251953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 5.0, 11.0, 9.0, 24.0, 29.0, 40.0, 31.0, 72.0, 86.0, 133.0, 219.0, 309.0, 546.0, 869.0, 1580.0, 3083.0, 6169.0, 13531.0, 30424.0, 69000.0, 144585.0, 243357.0, 249579.0, 151539.0, 72730.0, 32453.0, 14286.0, 6552.0, 3196.0, 1638.0, 915.0, 568.0, 354.0, 206.0, 140.0, 85.0, 52.0, 36.0, 31.0, 27.0, 14.0, 8.0, 8.0, 8.0, 1.0, 5.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.416259765625, -0.40402984619140625, -0.3917999267578125, -0.37957000732421875, -0.367340087890625, -0.35511016845703125, -0.3428802490234375, -0.33065032958984375, -0.31842041015625, -0.30619049072265625, -0.2939605712890625, -0.28173065185546875, -0.269500732421875, -0.25727081298828125, -0.2450408935546875, -0.23281097412109375, -0.2205810546875, -0.20835113525390625, -0.1961212158203125, -0.18389129638671875, -0.171661376953125, -0.15943145751953125, -0.1472015380859375, -0.13497161865234375, -0.12274169921875, -0.11051177978515625, -0.0982818603515625, -0.08605194091796875, -0.073822021484375, -0.06159210205078125, -0.0493621826171875, -0.03713226318359375, -0.02490234375, -0.01267242431640625, -0.0004425048828125, 0.01178741455078125, 0.024017333984375, 0.03624725341796875, 0.0484771728515625, 0.06070709228515625, 0.07293701171875, 0.08516693115234375, 0.0973968505859375, 0.10962677001953125, 0.121856689453125, 0.13408660888671875, 0.1463165283203125, 0.15854644775390625, 0.1707763671875, 0.18300628662109375, 0.1952362060546875, 0.20746612548828125, 0.219696044921875, 0.23192596435546875, 0.2441558837890625, 0.25638580322265625, 0.26861572265625, 0.28084564208984375, 0.2930755615234375, 0.30530548095703125, 0.317535400390625, 0.32976531982421875, 0.3419952392578125, 0.35422515869140625, 0.366455078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 9.0, 6.0, 6.0, 16.0, 23.0, 22.0, 24.0, 27.0, 32.0, 35.0, 39.0, 36.0, 43.0, 33.0, 45.0, 46.0, 37.0, 55.0, 36.0, 38.0, 50.0, 39.0, 41.0, 35.0, 34.0, 33.0, 29.0, 17.0, 17.0, 11.0, 21.0, 12.0, 10.0, 9.0, 9.0, 3.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.417724609375, -0.4046974182128906, -0.39167022705078125, -0.3786430358886719, -0.3656158447265625, -0.3525886535644531, -0.33956146240234375, -0.3265342712402344, -0.313507080078125, -0.3004798889160156, -0.28745269775390625, -0.2744255065917969, -0.2613983154296875, -0.24837112426757812, -0.23534393310546875, -0.22231674194335938, -0.20928955078125, -0.19626235961914062, -0.18323516845703125, -0.17020797729492188, -0.1571807861328125, -0.14415359497070312, -0.13112640380859375, -0.11809921264648438, -0.105072021484375, -0.09204483032226562, -0.07901763916015625, -0.06599044799804688, -0.0529632568359375, -0.039936065673828125, -0.02690887451171875, -0.013881683349609375, -0.0008544921875, 0.012172698974609375, 0.02519989013671875, 0.038227081298828125, 0.0512542724609375, 0.06428146362304688, 0.07730865478515625, 0.09033584594726562, 0.103363037109375, 0.11639022827148438, 0.12941741943359375, 0.14244461059570312, 0.1554718017578125, 0.16849899291992188, 0.18152618408203125, 0.19455337524414062, 0.20758056640625, 0.22060775756835938, 0.23363494873046875, 0.24666213989257812, 0.2596893310546875, 0.2727165222167969, 0.28574371337890625, 0.2987709045410156, 0.311798095703125, 0.3248252868652344, 0.33785247802734375, 0.3508796691894531, 0.3639068603515625, 0.3769340515136719, 0.38996124267578125, 0.4029884338378906, 0.416015625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 11.0, 16.0, 23.0, 51.0, 82.0, 113.0, 243.0, 456.0, 1142.0, 3925.0, 20118.0, 170189.0, 639023.0, 185171.0, 21862.0, 3982.0, 1120.0, 478.0, 242.0, 116.0, 82.0, 42.0, 25.0, 12.0, 15.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6822967529296875, -0.665863037109375, -0.6494293212890625, -0.63299560546875, -0.6165618896484375, -0.600128173828125, -0.5836944580078125, -0.5672607421875, -0.5508270263671875, -0.534393310546875, -0.5179595947265625, -0.50152587890625, -0.4850921630859375, -0.468658447265625, -0.4522247314453125, -0.435791015625, -0.4193572998046875, -0.402923583984375, -0.3864898681640625, -0.37005615234375, -0.3536224365234375, -0.337188720703125, -0.3207550048828125, -0.3043212890625, -0.2878875732421875, -0.271453857421875, -0.2550201416015625, -0.23858642578125, -0.2221527099609375, -0.205718994140625, -0.1892852783203125, -0.1728515625, -0.1564178466796875, -0.139984130859375, -0.1235504150390625, -0.10711669921875, -0.0906829833984375, -0.074249267578125, -0.0578155517578125, -0.0413818359375, -0.0249481201171875, -0.008514404296875, 0.0079193115234375, 0.02435302734375, 0.0407867431640625, 0.057220458984375, 0.0736541748046875, 0.090087890625, 0.1065216064453125, 0.122955322265625, 0.1393890380859375, 0.15582275390625, 0.1722564697265625, 0.188690185546875, 0.2051239013671875, 0.2215576171875, 0.2379913330078125, 0.254425048828125, 0.2708587646484375, 0.28729248046875, 0.3037261962890625, 0.320159912109375, 0.3365936279296875, 0.35302734375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 3.0, 2.0, 6.0, 3.0, 2.0, 7.0, 9.0, 13.0, 13.0, 10.0, 26.0, 21.0, 25.0, 30.0, 41.0, 39.0, 40.0, 52.0, 42.0, 57.0, 61.0, 55.0, 63.0, 52.0, 40.0, 43.0, 42.0, 32.0, 25.0, 17.0, 20.0, 20.0, 18.0, 9.0, 16.0, 11.0, 9.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.774332046508789e-05, -4.627928137779236e-05, -4.4815242290496826e-05, -4.3351203203201294e-05, -4.188716411590576e-05, -4.042312502861023e-05, -3.89590859413147e-05, -3.7495046854019165e-05, -3.603100776672363e-05, -3.45669686794281e-05, -3.310292959213257e-05, -3.1638890504837036e-05, -3.0174851417541504e-05, -2.871081233024597e-05, -2.724677324295044e-05, -2.5782734155654907e-05, -2.4318695068359375e-05, -2.2854655981063843e-05, -2.139061689376831e-05, -1.992657780647278e-05, -1.8462538719177246e-05, -1.6998499631881714e-05, -1.553446054458618e-05, -1.407042145729065e-05, -1.2606382369995117e-05, -1.1142343282699585e-05, -9.678304195404053e-06, -8.21426510810852e-06, -6.750226020812988e-06, -5.286186933517456e-06, -3.822147846221924e-06, -2.3581087589263916e-06, -8.940696716308594e-07, 5.699694156646729e-07, 2.034008502960205e-06, 3.4980475902557373e-06, 4.9620866775512695e-06, 6.426125764846802e-06, 7.890164852142334e-06, 9.354203939437866e-06, 1.0818243026733398e-05, 1.228228211402893e-05, 1.3746321201324463e-05, 1.5210360288619995e-05, 1.6674399375915527e-05, 1.813843846321106e-05, 1.9602477550506592e-05, 2.1066516637802124e-05, 2.2530555725097656e-05, 2.399459481239319e-05, 2.545863389968872e-05, 2.6922672986984253e-05, 2.8386712074279785e-05, 2.9850751161575317e-05, 3.131479024887085e-05, 3.277882933616638e-05, 3.4242868423461914e-05, 3.5706907510757446e-05, 3.717094659805298e-05, 3.863498568534851e-05, 4.009902477264404e-05, 4.1563063859939575e-05, 4.302710294723511e-05, 4.449114203453064e-05, 4.595518112182617e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 2.0, 5.0, 3.0, 15.0, 20.0, 24.0, 40.0, 51.0, 84.0, 170.0, 295.0, 556.0, 1138.0, 2745.0, 7517.0, 26589.0, 117445.0, 406685.0, 360532.0, 92858.0, 21109.0, 6050.0, 2281.0, 1101.0, 495.0, 298.0, 145.0, 112.0, 62.0, 39.0, 31.0, 22.0, 12.0, 5.0, 7.0, 7.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.36572265625, -0.3552513122558594, -0.34477996826171875, -0.3343086242675781, -0.3238372802734375, -0.3133659362792969, -0.30289459228515625, -0.2924232482910156, -0.281951904296875, -0.2714805603027344, -0.26100921630859375, -0.2505378723144531, -0.2400665283203125, -0.22959518432617188, -0.21912384033203125, -0.20865249633789062, -0.19818115234375, -0.18770980834960938, -0.17723846435546875, -0.16676712036132812, -0.1562957763671875, -0.14582443237304688, -0.13535308837890625, -0.12488174438476562, -0.114410400390625, -0.10393905639648438, -0.09346771240234375, -0.08299636840820312, -0.0725250244140625, -0.062053680419921875, -0.05158233642578125, -0.041110992431640625, -0.0306396484375, -0.020168304443359375, -0.00969696044921875, 0.000774383544921875, 0.0112457275390625, 0.021717071533203125, 0.03218841552734375, 0.042659759521484375, 0.053131103515625, 0.06360244750976562, 0.07407379150390625, 0.08454513549804688, 0.0950164794921875, 0.10548782348632812, 0.11595916748046875, 0.12643051147460938, 0.13690185546875, 0.14737319946289062, 0.15784454345703125, 0.16831588745117188, 0.1787872314453125, 0.18925857543945312, 0.19972991943359375, 0.21020126342773438, 0.220672607421875, 0.23114395141601562, 0.24161529541015625, 0.2520866394042969, 0.2625579833984375, 0.2730293273925781, 0.28350067138671875, 0.2939720153808594, 0.304443359375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 2.0, 4.0, 6.0, 10.0, 15.0, 15.0, 28.0, 24.0, 47.0, 52.0, 64.0, 62.0, 98.0, 78.0, 78.0, 69.0, 74.0, 70.0, 38.0, 39.0, 34.0, 25.0, 18.0, 12.0, 12.0, 9.0, 3.0, 6.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2213134765625, -0.21305274963378906, -0.20479202270507812, -0.1965312957763672, -0.18827056884765625, -0.1800098419189453, -0.17174911499023438, -0.16348838806152344, -0.1552276611328125, -0.14696693420410156, -0.13870620727539062, -0.1304454803466797, -0.12218475341796875, -0.11392402648925781, -0.10566329956054688, -0.09740257263183594, -0.089141845703125, -0.08088111877441406, -0.07262039184570312, -0.06435966491699219, -0.05609893798828125, -0.04783821105957031, -0.039577484130859375, -0.03131675720214844, -0.0230560302734375, -0.014795303344726562, -0.006534576416015625, 0.0017261505126953125, 0.00998687744140625, 0.018247604370117188, 0.026508331298828125, 0.03476905822753906, 0.04302978515625, 0.05129051208496094, 0.059551239013671875, 0.06781196594238281, 0.07607269287109375, 0.08433341979980469, 0.09259414672851562, 0.10085487365722656, 0.1091156005859375, 0.11737632751464844, 0.12563705444335938, 0.1338977813720703, 0.14215850830078125, 0.1504192352294922, 0.15867996215820312, 0.16694068908691406, 0.175201416015625, 0.18346214294433594, 0.19172286987304688, 0.1999835968017578, 0.20824432373046875, 0.2165050506591797, 0.22476577758789062, 0.23302650451660156, 0.2412872314453125, 0.24954795837402344, 0.2578086853027344, 0.2660694122314453, 0.27433013916015625, 0.2825908660888672, 0.2908515930175781, 0.29911231994628906, 0.307373046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 12.0, 12.0, 32.0, 67.0, 90.0, 133.0, 171.0, 186.0, 111.0, 78.0, 53.0, 31.0, 14.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.09897232055664, -7.904950141906738, -7.710928440093994, -7.516906261444092, -7.322884559631348, -7.128862380981445, -6.934840202331543, -6.740818023681641, -6.5467963218688965, -6.352774143218994, -6.15875244140625, -5.964730262756348, -5.770708084106445, -5.576686382293701, -5.382664203643799, -5.188642501831055, -4.994620323181152, -4.80059814453125, -4.606576442718506, -4.4125542640686035, -4.218532562255859, -4.024510383605957, -3.8304882049560547, -3.6364662647247314, -3.442444324493408, -3.248422384262085, -3.0544004440307617, -2.8603782653808594, -2.666356325149536, -2.472334384918213, -2.2783122062683105, -2.0842902660369873, -1.890268325805664, -1.6962463855743408, -1.502224326133728, -1.3082022666931152, -1.114180326461792, -0.920158326625824, -0.726136326789856, -0.5321142673492432, -0.3380923271179199, -0.1440703272819519, 0.04995167255401611, 0.24397367238998413, 0.43799567222595215, 0.6320176720619202, 0.8260396718978882, 1.020061731338501, 1.2140836715698242, 1.4081056118011475, 1.6021276712417603, 1.796149730682373, 1.9901716709136963, 2.1841936111450195, 2.378215789794922, 2.572237730026245, 2.7662596702575684, 2.9602816104888916, 3.154303550720215, 3.348325729370117, 3.5423476696014404, 3.7363696098327637, 3.930391788482666, 4.12441349029541, 4.3184356689453125]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 10.0, 8.0, 9.0, 16.0, 14.0, 15.0, 19.0, 23.0, 21.0, 24.0, 23.0, 36.0, 49.0, 49.0, 38.0, 42.0, 67.0, 56.0, 55.0, 47.0, 46.0, 42.0, 43.0, 46.0, 31.0, 28.0, 31.0, 13.0, 21.0, 19.0, 9.0, 13.0, 7.0, 12.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8482842445373535, -2.7652475833892822, -2.682210922241211, -2.5991744995117188, -2.5161378383636475, -2.433101177215576, -2.350064516067505, -2.2670278549194336, -2.1839914321899414, -2.10095477104187, -2.017918109893799, -1.934881567955017, -1.8518450260162354, -1.768808364868164, -1.6857717037200928, -1.6027350425720215, -1.5196983814239502, -1.436661720275879, -1.3536251783370972, -1.2705885171890259, -1.1875519752502441, -1.1045153141021729, -1.0214786529541016, -0.938442051410675, -0.8554054498672485, -0.772368848323822, -0.6893322467803955, -0.6062955856323242, -0.5232589840888977, -0.4402223825454712, -0.3571857511997223, -0.2741491198539734, -0.19111251831054688, -0.10807590186595917, -0.02503928542137146, 0.05799733102321625, 0.14103394746780396, 0.22407054901123047, 0.30710718035697937, 0.39014381170272827, 0.4731804132461548, 0.5562170147895813, 0.6392536163330078, 0.7222902774810791, 0.8053268790245056, 0.8883634805679321, 0.9714001417160034, 1.0544366836547852, 1.1374733448028564, 1.2205100059509277, 1.3035465478897095, 1.3865832090377808, 1.4696197509765625, 1.5526564121246338, 1.635693073272705, 1.7187297344207764, 1.801766276359558, 1.8848029375076294, 1.9678394794464111, 2.0508761405944824, 2.1339128017425537, 2.216949462890625, 2.299985885620117, 2.3830225467681885, 2.4660592079162598]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 4.0, 14.0, 10.0, 20.0, 30.0, 48.0, 61.0, 108.0, 160.0, 361.0, 793.0, 2220.0, 9289.0, 110831.0, 3991566.0, 68126.0, 7455.0, 1782.0, 632.0, 256.0, 154.0, 104.0, 69.0, 53.0, 26.0, 22.0, 13.0, 16.0, 9.0, 5.0, 13.0, 5.0, 3.0, 5.0, 6.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7939453125, -1.7308502197265625, -1.667755126953125, -1.6046600341796875, -1.54156494140625, -1.4784698486328125, -1.415374755859375, -1.3522796630859375, -1.2891845703125, -1.2260894775390625, -1.162994384765625, -1.0998992919921875, -1.03680419921875, -0.9737091064453125, -0.910614013671875, -0.8475189208984375, -0.784423828125, -0.7213287353515625, -0.658233642578125, -0.5951385498046875, -0.53204345703125, -0.4689483642578125, -0.405853271484375, -0.3427581787109375, -0.2796630859375, -0.2165679931640625, -0.153472900390625, -0.0903778076171875, -0.02728271484375, 0.0358123779296875, 0.098907470703125, 0.1620025634765625, 0.22509765625, 0.2881927490234375, 0.351287841796875, 0.4143829345703125, 0.47747802734375, 0.5405731201171875, 0.603668212890625, 0.6667633056640625, 0.7298583984375, 0.7929534912109375, 0.856048583984375, 0.9191436767578125, 0.98223876953125, 1.0453338623046875, 1.108428955078125, 1.1715240478515625, 1.234619140625, 1.2977142333984375, 1.360809326171875, 1.4239044189453125, 1.48699951171875, 1.5500946044921875, 1.613189697265625, 1.6762847900390625, 1.7393798828125, 1.8024749755859375, 1.865570068359375, 1.9286651611328125, 1.99176025390625, 2.0548553466796875, 2.117950439453125, 2.1810455322265625, 2.244140625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 10.0, 9.0, 17.0, 22.0, 29.0, 28.0, 47.0, 53.0, 80.0, 82.0, 103.0, 98.0, 104.0, 74.0, 69.0, 53.0, 31.0, 32.0, 22.0, 14.0, 6.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.173828125, -0.1680622100830078, -0.16229629516601562, -0.15653038024902344, -0.15076446533203125, -0.14499855041503906, -0.13923263549804688, -0.1334667205810547, -0.1277008056640625, -0.12193489074707031, -0.11616897583007812, -0.11040306091308594, -0.10463714599609375, -0.09887123107910156, -0.09310531616210938, -0.08733940124511719, -0.081573486328125, -0.07580757141113281, -0.07004165649414062, -0.06427574157714844, -0.05850982666015625, -0.05274391174316406, -0.046977996826171875, -0.04121208190917969, -0.0354461669921875, -0.029680252075195312, -0.023914337158203125, -0.018148422241210938, -0.01238250732421875, -0.0066165924072265625, -0.000850677490234375, 0.0049152374267578125, 0.01068115234375, 0.016447067260742188, 0.022212982177734375, 0.027978897094726562, 0.03374481201171875, 0.03951072692871094, 0.045276641845703125, 0.05104255676269531, 0.0568084716796875, 0.06257438659667969, 0.06834030151367188, 0.07410621643066406, 0.07987213134765625, 0.08563804626464844, 0.09140396118164062, 0.09716987609863281, 0.102935791015625, 0.10870170593261719, 0.11446762084960938, 0.12023353576660156, 0.12599945068359375, 0.13176536560058594, 0.13753128051757812, 0.1432971954345703, 0.1490631103515625, 0.1548290252685547, 0.16059494018554688, 0.16636085510253906, 0.17212677001953125, 0.17789268493652344, 0.18365859985351562, 0.1894245147705078, 0.1951904296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 4.0, 11.0, 16.0, 16.0, 41.0, 53.0, 81.0, 116.0, 205.0, 323.0, 651.0, 1190.0, 2380.0, 5614.0, 16154.0, 67340.0, 720778.0, 3170027.0, 165150.0, 28746.0, 8435.0, 3368.0, 1547.0, 797.0, 482.0, 254.0, 201.0, 106.0, 71.0, 40.0, 28.0, 18.0, 14.0, 6.0, 1.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83251953125, -0.8058624267578125, -0.779205322265625, -0.7525482177734375, -0.72589111328125, -0.6992340087890625, -0.672576904296875, -0.6459197998046875, -0.6192626953125, -0.5926055908203125, -0.565948486328125, -0.5392913818359375, -0.51263427734375, -0.4859771728515625, -0.459320068359375, -0.4326629638671875, -0.406005859375, -0.3793487548828125, -0.352691650390625, -0.3260345458984375, -0.29937744140625, -0.2727203369140625, -0.246063232421875, -0.2194061279296875, -0.1927490234375, -0.1660919189453125, -0.139434814453125, -0.1127777099609375, -0.08612060546875, -0.0594635009765625, -0.032806396484375, -0.0061492919921875, 0.0205078125, 0.0471649169921875, 0.073822021484375, 0.1004791259765625, 0.12713623046875, 0.1537933349609375, 0.180450439453125, 0.2071075439453125, 0.2337646484375, 0.2604217529296875, 0.287078857421875, 0.3137359619140625, 0.34039306640625, 0.3670501708984375, 0.393707275390625, 0.4203643798828125, 0.447021484375, 0.4736785888671875, 0.500335693359375, 0.5269927978515625, 0.55364990234375, 0.5803070068359375, 0.606964111328125, 0.6336212158203125, 0.6602783203125, 0.6869354248046875, 0.713592529296875, 0.7402496337890625, 0.76690673828125, 0.7935638427734375, 0.820220947265625, 0.8468780517578125, 0.87353515625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 3.0, 2.0, 6.0, 9.0, 9.0, 20.0, 27.0, 25.0, 41.0, 74.0, 107.0, 184.0, 500.0, 1233.0, 991.0, 381.0, 186.0, 100.0, 70.0, 35.0, 24.0, 12.0, 9.0, 9.0, 9.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24691390991210938, -0.23699188232421875, -0.22706985473632812, -0.2171478271484375, -0.20722579956054688, -0.19730377197265625, -0.18738174438476562, -0.177459716796875, -0.16753768920898438, -0.15761566162109375, -0.14769363403320312, -0.1377716064453125, -0.12784957885742188, -0.11792755126953125, -0.10800552368164062, -0.09808349609375, -0.08816146850585938, -0.07823944091796875, -0.06831741333007812, -0.0583953857421875, -0.048473358154296875, -0.03855133056640625, -0.028629302978515625, -0.018707275390625, -0.008785247802734375, 0.00113677978515625, 0.011058807373046875, 0.0209808349609375, 0.030902862548828125, 0.04082489013671875, 0.050746917724609375, 0.0606689453125, 0.07059097290039062, 0.08051300048828125, 0.09043502807617188, 0.1003570556640625, 0.11027908325195312, 0.12020111083984375, 0.13012313842773438, 0.140045166015625, 0.14996719360351562, 0.15988922119140625, 0.16981124877929688, 0.1797332763671875, 0.18965530395507812, 0.19957733154296875, 0.20949935913085938, 0.21942138671875, 0.22934341430664062, 0.23926544189453125, 0.24918746948242188, 0.2591094970703125, 0.2690315246582031, 0.27895355224609375, 0.2888755798339844, 0.298797607421875, 0.3087196350097656, 0.31864166259765625, 0.3285636901855469, 0.3384857177734375, 0.3484077453613281, 0.35832977294921875, 0.3682518005371094, 0.378173828125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 15.0, 28.0, 106.0, 225.0, 327.0, 206.0, 63.0, 26.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.445000648498535, -4.303231716156006, -4.161463260650635, -4.0196943283081055, -3.8779256343841553, -3.736156940460205, -3.594388008117676, -3.4526193141937256, -3.3108506202697754, -3.169081926345825, -3.027313232421875, -2.8855443000793457, -2.7437756061553955, -2.6020069122314453, -2.460237979888916, -2.318469285964966, -2.1767005920410156, -2.0349318981170654, -1.8931630849838257, -1.751394271850586, -1.6096255779266357, -1.4678568840026855, -1.3260880708694458, -1.184319257736206, -1.0425505638122559, -0.9007818102836609, -0.7590130567550659, -0.617244303226471, -0.475475549697876, -0.333706796169281, -0.19193804264068604, -0.050169289112091064, 0.0915989875793457, 0.23336774110794067, 0.37513649463653564, 0.5169052481651306, 0.6586740016937256, 0.8004427552223206, 0.9422115087509155, 1.0839803218841553, 1.2257490158081055, 1.3675177097320557, 1.5092865228652954, 1.6510553359985352, 1.7928240299224854, 1.9345927238464355, 2.076361656188965, 2.218130350112915, 2.3598990440368652, 2.5016677379608154, 2.6434364318847656, 2.785205364227295, 2.926974058151245, 3.0687427520751953, 3.2105116844177246, 3.352280378341675, 3.494049072265625, 3.635817766189575, 3.7775864601135254, 3.9193553924560547, 4.061123847961426, 4.202892780303955, 4.344661712646484, 4.4864301681518555, 4.628199100494385]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 8.0, 10.0, 8.0, 10.0, 8.0, 11.0, 17.0, 20.0, 21.0, 25.0, 35.0, 50.0, 28.0, 44.0, 43.0, 55.0, 51.0, 53.0, 49.0, 51.0, 53.0, 40.0, 42.0, 21.0, 34.0, 43.0, 28.0, 28.0, 24.0, 13.0, 14.0, 16.0, 13.0, 12.0, 6.0, 9.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.898186981678009, -0.8695569634437561, -0.840927004814148, -0.812296986579895, -0.7836670279502869, -0.7550370097160339, -0.7264070510864258, -0.6977770328521729, -0.6691470146179199, -0.640516996383667, -0.6118870377540588, -0.5832570195198059, -0.5546270608901978, -0.5259970426559448, -0.4973670542240143, -0.46873706579208374, -0.4401070773601532, -0.41147708892822266, -0.3828471004962921, -0.3542171120643616, -0.32558709383010864, -0.2969571053981781, -0.26832711696624756, -0.23969711363315582, -0.21106712520122528, -0.18243713676929474, -0.153807133436203, -0.12517714500427246, -0.09654714912176132, -0.06791715323925018, -0.03928716480731964, -0.010657161474227905, 0.017972826957702637, 0.046602822840213776, 0.07523281872272491, 0.10386280715465546, 0.1324928104877472, 0.16112279891967773, 0.18975278735160828, 0.2183827906847, 0.24701277911663055, 0.2756427824497223, 0.30427277088165283, 0.3329027593135834, 0.3615327477455139, 0.39016276597976685, 0.418792724609375, 0.44742274284362793, 0.47605273127555847, 0.504682719707489, 0.5333127379417419, 0.5619426965713501, 0.590572714805603, 0.619202733039856, 0.6478326916694641, 0.676462709903717, 0.7050926685333252, 0.7337226867675781, 0.7623526453971863, 0.7909826636314392, 0.8196126222610474, 0.8482426404953003, 0.8768726587295532, 0.9055026173591614, 0.9341326355934143]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 13.0, 15.0, 12.0, 28.0, 38.0, 47.0, 77.0, 144.0, 204.0, 403.0, 890.0, 2365.0, 9360.0, 83565.0, 650138.0, 270736.0, 23772.0, 4124.0, 1287.0, 569.0, 298.0, 163.0, 94.0, 67.0, 37.0, 33.0, 20.0, 17.0, 9.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7568359375, -1.70147705078125, -1.6461181640625, -1.59075927734375, -1.535400390625, -1.48004150390625, -1.4246826171875, -1.36932373046875, -1.31396484375, -1.25860595703125, -1.2032470703125, -1.14788818359375, -1.092529296875, -1.03717041015625, -0.9818115234375, -0.92645263671875, -0.87109375, -0.81573486328125, -0.7603759765625, -0.70501708984375, -0.649658203125, -0.59429931640625, -0.5389404296875, -0.48358154296875, -0.42822265625, -0.37286376953125, -0.3175048828125, -0.26214599609375, -0.206787109375, -0.15142822265625, -0.0960693359375, -0.04071044921875, 0.0146484375, 0.07000732421875, 0.1253662109375, 0.18072509765625, 0.236083984375, 0.29144287109375, 0.3468017578125, 0.40216064453125, 0.45751953125, 0.51287841796875, 0.5682373046875, 0.62359619140625, 0.678955078125, 0.73431396484375, 0.7896728515625, 0.84503173828125, 0.900390625, 0.95574951171875, 1.0111083984375, 1.06646728515625, 1.121826171875, 1.17718505859375, 1.2325439453125, 1.28790283203125, 1.34326171875, 1.39862060546875, 1.4539794921875, 1.50933837890625, 1.564697265625, 1.62005615234375, 1.6754150390625, 1.73077392578125, 1.7861328125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 7.0, 10.0, 11.0, 15.0, 30.0, 34.0, 27.0, 51.0, 60.0, 65.0, 67.0, 99.0, 86.0, 75.0, 84.0, 74.0, 54.0, 44.0, 28.0, 25.0, 10.0, 9.0, 9.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.16636085510253906, -0.16084671020507812, -0.1553325653076172, -0.14981842041015625, -0.1443042755126953, -0.13879013061523438, -0.13327598571777344, -0.1277618408203125, -0.12224769592285156, -0.11673355102539062, -0.11121940612792969, -0.10570526123046875, -0.10019111633300781, -0.09467697143554688, -0.08916282653808594, -0.083648681640625, -0.07813453674316406, -0.07262039184570312, -0.06710624694824219, -0.06159210205078125, -0.05607795715332031, -0.050563812255859375, -0.04504966735839844, -0.0395355224609375, -0.03402137756347656, -0.028507232666015625, -0.022993087768554688, -0.01747894287109375, -0.011964797973632812, -0.006450653076171875, -0.0009365081787109375, 0.00457763671875, 0.010091781616210938, 0.015605926513671875, 0.021120071411132812, 0.02663421630859375, 0.03214836120605469, 0.037662506103515625, 0.04317665100097656, 0.0486907958984375, 0.05420494079589844, 0.059719085693359375, 0.06523323059082031, 0.07074737548828125, 0.07626152038574219, 0.08177566528320312, 0.08728981018066406, 0.092803955078125, 0.09831809997558594, 0.10383224487304688, 0.10934638977050781, 0.11486053466796875, 0.12037467956542969, 0.12588882446289062, 0.13140296936035156, 0.1369171142578125, 0.14243125915527344, 0.14794540405273438, 0.1534595489501953, 0.15897369384765625, 0.1644878387451172, 0.17000198364257812, 0.17551612854003906, 0.1810302734375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 5.0, 9.0, 18.0, 30.0, 27.0, 36.0, 59.0, 65.0, 103.0, 173.0, 251.0, 434.0, 749.0, 1231.0, 2253.0, 4637.0, 10041.0, 23398.0, 55715.0, 132140.0, 258491.0, 280749.0, 157550.0, 68349.0, 28108.0, 12118.0, 5424.0, 2621.0, 1500.0, 802.0, 486.0, 305.0, 207.0, 140.0, 93.0, 84.0, 40.0, 29.0, 22.0, 17.0, 12.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.50830078125, -0.4938240051269531, -0.47934722900390625, -0.4648704528808594, -0.4503936767578125, -0.4359169006347656, -0.42144012451171875, -0.4069633483886719, -0.392486572265625, -0.3780097961425781, -0.36353302001953125, -0.3490562438964844, -0.3345794677734375, -0.3201026916503906, -0.30562591552734375, -0.2911491394042969, -0.27667236328125, -0.2621955871582031, -0.24771881103515625, -0.23324203491210938, -0.2187652587890625, -0.20428848266601562, -0.18981170654296875, -0.17533493041992188, -0.160858154296875, -0.14638137817382812, -0.13190460205078125, -0.11742782592773438, -0.1029510498046875, -0.08847427368164062, -0.07399749755859375, -0.059520721435546875, -0.0450439453125, -0.030567169189453125, -0.01609039306640625, -0.001613616943359375, 0.0128631591796875, 0.027339935302734375, 0.04181671142578125, 0.056293487548828125, 0.070770263671875, 0.08524703979492188, 0.09972381591796875, 0.11420059204101562, 0.1286773681640625, 0.14315414428710938, 0.15763092041015625, 0.17210769653320312, 0.18658447265625, 0.20106124877929688, 0.21553802490234375, 0.23001480102539062, 0.2444915771484375, 0.2589683532714844, 0.27344512939453125, 0.2879219055175781, 0.302398681640625, 0.3168754577636719, 0.33135223388671875, 0.3458290100097656, 0.3603057861328125, 0.3747825622558594, 0.38925933837890625, 0.4037361145019531, 0.418212890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 13.0, 14.0, 19.0, 26.0, 28.0, 16.0, 35.0, 34.0, 29.0, 33.0, 35.0, 43.0, 42.0, 38.0, 51.0, 47.0, 47.0, 48.0, 43.0, 41.0, 53.0, 34.0, 42.0, 23.0, 28.0, 19.0, 18.0, 16.0, 12.0, 7.0, 15.0, 3.0, 6.0, 6.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.486083984375, -0.4711265563964844, -0.45616912841796875, -0.4412117004394531, -0.4262542724609375, -0.4112968444824219, -0.39633941650390625, -0.3813819885253906, -0.366424560546875, -0.3514671325683594, -0.33650970458984375, -0.3215522766113281, -0.3065948486328125, -0.2916374206542969, -0.27667999267578125, -0.2617225646972656, -0.24676513671875, -0.23180770874023438, -0.21685028076171875, -0.20189285278320312, -0.1869354248046875, -0.17197799682617188, -0.15702056884765625, -0.14206314086914062, -0.127105712890625, -0.11214828491210938, -0.09719085693359375, -0.08223342895507812, -0.0672760009765625, -0.052318572998046875, -0.03736114501953125, -0.022403717041015625, -0.0074462890625, 0.007511138916015625, 0.02246856689453125, 0.037425994873046875, 0.0523834228515625, 0.06734085083007812, 0.08229827880859375, 0.09725570678710938, 0.112213134765625, 0.12717056274414062, 0.14212799072265625, 0.15708541870117188, 0.1720428466796875, 0.18700027465820312, 0.20195770263671875, 0.21691513061523438, 0.23187255859375, 0.24682998657226562, 0.26178741455078125, 0.2767448425292969, 0.2917022705078125, 0.3066596984863281, 0.32161712646484375, 0.3365745544433594, 0.351531982421875, 0.3664894104003906, 0.38144683837890625, 0.3964042663574219, 0.4113616943359375, 0.4263191223144531, 0.44127655029296875, 0.4562339782714844, 0.47119140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 5.0, 20.0, 30.0, 34.0, 74.0, 146.0, 304.0, 724.0, 2074.0, 9897.0, 96603.0, 697332.0, 217942.0, 18652.0, 3040.0, 925.0, 359.0, 175.0, 89.0, 47.0, 32.0, 16.0, 9.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5841064453125, -0.563720703125, -0.5433349609375, -0.52294921875, -0.5025634765625, -0.482177734375, -0.4617919921875, -0.44140625, -0.4210205078125, -0.400634765625, -0.3802490234375, -0.35986328125, -0.3394775390625, -0.319091796875, -0.2987060546875, -0.2783203125, -0.2579345703125, -0.237548828125, -0.2171630859375, -0.19677734375, -0.1763916015625, -0.156005859375, -0.1356201171875, -0.115234375, -0.0948486328125, -0.074462890625, -0.0540771484375, -0.03369140625, -0.0133056640625, 0.007080078125, 0.0274658203125, 0.0478515625, 0.0682373046875, 0.088623046875, 0.1090087890625, 0.12939453125, 0.1497802734375, 0.170166015625, 0.1905517578125, 0.2109375, 0.2313232421875, 0.251708984375, 0.2720947265625, 0.29248046875, 0.3128662109375, 0.333251953125, 0.3536376953125, 0.3740234375, 0.3944091796875, 0.414794921875, 0.4351806640625, 0.45556640625, 0.4759521484375, 0.496337890625, 0.5167236328125, 0.537109375, 0.5574951171875, 0.577880859375, 0.5982666015625, 0.61865234375, 0.6390380859375, 0.659423828125, 0.6798095703125, 0.7001953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 8.0, 12.0, 17.0, 20.0, 40.0, 59.0, 93.0, 160.0, 175.0, 148.0, 98.0, 57.0, 43.0, 28.0, 18.0, 10.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001691579818725586, -0.00016463827341794968, -0.00016011856496334076, -0.00015559885650873184, -0.00015107914805412292, -0.000146559439599514, -0.0001420397311449051, -0.00013752002269029617, -0.00013300031423568726, -0.00012848060578107834, -0.00012396089732646942, -0.0001194411888718605, -0.00011492148041725159, -0.00011040177196264267, -0.00010588206350803375, -0.00010136235505342484, -9.684264659881592e-05, -9.2322938144207e-05, -8.780322968959808e-05, -8.328352123498917e-05, -7.876381278038025e-05, -7.424410432577133e-05, -6.972439587116241e-05, -6.52046874165535e-05, -6.068497896194458e-05, -5.616527050733566e-05, -5.1645562052726746e-05, -4.712585359811783e-05, -4.260614514350891e-05, -3.8086436688899994e-05, -3.356672823429108e-05, -2.904701977968216e-05, -2.4527311325073242e-05, -2.0007602870464325e-05, -1.5487894415855408e-05, -1.096818596124649e-05, -6.448477506637573e-06, -1.928769052028656e-06, 2.5909394025802612e-06, 7.1106478571891785e-06, 1.1630356311798096e-05, 1.6150064766407013e-05, 2.066977322101593e-05, 2.5189481675624847e-05, 2.9709190130233765e-05, 3.422889858484268e-05, 3.87486070394516e-05, 4.3268315494060516e-05, 4.7788023948669434e-05, 5.230773240327835e-05, 5.682744085788727e-05, 6.134714931249619e-05, 6.58668577671051e-05, 7.038656622171402e-05, 7.490627467632294e-05, 7.942598313093185e-05, 8.394569158554077e-05, 8.846540004014969e-05, 9.29851084947586e-05, 9.750481694936752e-05, 0.00010202452540397644, 0.00010654423385858536, 0.00011106394231319427, 0.00011558365076780319, 0.00012010335922241211]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 9.0, 7.0, 12.0, 16.0, 27.0, 39.0, 83.0, 136.0, 243.0, 511.0, 1157.0, 3107.0, 9344.0, 35465.0, 184332.0, 546782.0, 211012.0, 40221.0, 10286.0, 3356.0, 1257.0, 574.0, 250.0, 132.0, 76.0, 45.0, 29.0, 20.0, 9.0, 8.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36865234375, -0.3552665710449219, -0.34188079833984375, -0.3284950256347656, -0.3151092529296875, -0.3017234802246094, -0.28833770751953125, -0.2749519348144531, -0.261566162109375, -0.24818038940429688, -0.23479461669921875, -0.22140884399414062, -0.2080230712890625, -0.19463729858398438, -0.18125152587890625, -0.16786575317382812, -0.15447998046875, -0.14109420776367188, -0.12770843505859375, -0.11432266235351562, -0.1009368896484375, -0.08755111694335938, -0.07416534423828125, -0.060779571533203125, -0.047393798828125, -0.034008026123046875, -0.02062225341796875, -0.007236480712890625, 0.0061492919921875, 0.019535064697265625, 0.03292083740234375, 0.046306610107421875, 0.0596923828125, 0.07307815551757812, 0.08646392822265625, 0.09984970092773438, 0.1132354736328125, 0.12662124633789062, 0.14000701904296875, 0.15339279174804688, 0.166778564453125, 0.18016433715820312, 0.19355010986328125, 0.20693588256835938, 0.2203216552734375, 0.23370742797851562, 0.24709320068359375, 0.2604789733886719, 0.27386474609375, 0.2872505187988281, 0.30063629150390625, 0.3140220642089844, 0.3274078369140625, 0.3407936096191406, 0.35417938232421875, 0.3675651550292969, 0.380950927734375, 0.3943367004394531, 0.40772247314453125, 0.4211082458496094, 0.4344940185546875, 0.4478797912597656, 0.46126556396484375, 0.4746513366699219, 0.488037109375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 9.0, 7.0, 7.0, 12.0, 15.0, 30.0, 33.0, 45.0, 48.0, 65.0, 97.0, 108.0, 100.0, 94.0, 85.0, 69.0, 50.0, 37.0, 28.0, 18.0, 10.0, 12.0, 5.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.51416015625, -0.5027713775634766, -0.4913825988769531, -0.4799938201904297, -0.46860504150390625, -0.4572162628173828, -0.4458274841308594, -0.43443870544433594, -0.4230499267578125, -0.41166114807128906, -0.4002723693847656, -0.3888835906982422, -0.37749481201171875, -0.3661060333251953, -0.3547172546386719, -0.34332847595214844, -0.331939697265625, -0.32055091857910156, -0.3091621398925781, -0.2977733612060547, -0.28638458251953125, -0.2749958038330078, -0.2636070251464844, -0.25221824645996094, -0.2408294677734375, -0.22944068908691406, -0.21805191040039062, -0.2066631317138672, -0.19527435302734375, -0.1838855743408203, -0.17249679565429688, -0.16110801696777344, -0.14971923828125, -0.13833045959472656, -0.12694168090820312, -0.11555290222167969, -0.10416412353515625, -0.09277534484863281, -0.08138656616210938, -0.06999778747558594, -0.0586090087890625, -0.04722023010253906, -0.035831451416015625, -0.024442672729492188, -0.01305389404296875, -0.0016651153564453125, 0.009723663330078125, 0.021112442016601562, 0.032501220703125, 0.04388999938964844, 0.055278778076171875, 0.06666755676269531, 0.07805633544921875, 0.08944511413574219, 0.10083389282226562, 0.11222267150878906, 0.1236114501953125, 0.13500022888183594, 0.14638900756835938, 0.1577777862548828, 0.16916656494140625, 0.1805553436279297, 0.19194412231445312, 0.20333290100097656, 0.2147216796875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 11.0, 33.0, 73.0, 161.0, 242.0, 237.0, 129.0, 76.0, 28.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.384471893310547, -12.057840347290039, -11.731209754943848, -11.40457820892334, -11.077946662902832, -10.751315116882324, -10.424684524536133, -10.098052978515625, -9.771421432495117, -9.44478988647461, -9.118159294128418, -8.79152774810791, -8.464896202087402, -8.138264656066895, -7.811634063720703, -7.485002517700195, -7.158371448516846, -6.831740379333496, -6.505108833312988, -6.178477764129639, -5.851846218109131, -5.525215148925781, -5.198583602905273, -4.871952533721924, -4.545321464538574, -4.218690395355225, -3.892058849334717, -3.565427780151367, -3.2387962341308594, -2.9121651649475098, -2.585533857345581, -2.2589025497436523, -1.9322710037231445, -1.6056396961212158, -1.279008388519287, -0.952377200126648, -0.6257458925247192, -0.2991145849227905, 0.027516603469848633, 0.35414791107177734, 0.680779218673706, 1.0074105262756348, 1.3340418338775635, 1.6606730222702026, 1.9873043298721313, 2.3139357566833496, 2.640566825866699, 2.967198133468628, 3.2938294410705566, 3.6204607486724854, 3.947092056274414, 4.273723125457764, 4.6003546714782715, 4.926985740661621, 5.253617286682129, 5.5802483558654785, 5.906879425048828, 6.233510494232178, 6.5601420402526855, 6.886773109436035, 7.213404655456543, 7.540035724639893, 7.866666793823242, 8.19329833984375, 8.519929885864258]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 5.0, 8.0, 9.0, 6.0, 11.0, 8.0, 21.0, 27.0, 29.0, 31.0, 32.0, 37.0, 34.0, 42.0, 47.0, 43.0, 41.0, 53.0, 46.0, 45.0, 41.0, 54.0, 48.0, 45.0, 45.0, 20.0, 31.0, 21.0, 19.0, 18.0, 13.0, 18.0, 8.0, 15.0, 6.0, 6.0, 4.0, 5.0, 1.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.027097702026367, -2.935706853866577, -2.844316005706787, -2.752925157546997, -2.661534309387207, -2.570143699645996, -2.478752851486206, -2.387362003326416, -2.295971155166626, -2.204580307006836, -2.113189458847046, -2.021798610687256, -1.9304078817367554, -1.8390170335769653, -1.7476263046264648, -1.6562354564666748, -1.5648446083068848, -1.4734537601470947, -1.3820629119873047, -1.2906721830368042, -1.1992813348770142, -1.1078904867172241, -1.0164997577667236, -0.9251089096069336, -0.8337180614471436, -0.7423272132873535, -0.6509364247322083, -0.559545636177063, -0.46815478801727295, -0.3767639696598053, -0.28537315130233765, -0.19398236274719238, -0.10259175300598145, -0.011200934648513794, 0.08018988370895386, 0.1715807020664215, 0.26297152042388916, 0.3543623387813568, 0.44575315713882446, 0.5371439456939697, 0.6285347938537598, 0.7199256420135498, 0.8113164305686951, 0.9027072191238403, 0.9940980672836304, 1.0854889154434204, 1.176879644393921, 1.268270492553711, 1.359661340713501, 1.451052188873291, 1.542443037033081, 1.6338337659835815, 1.7252246141433716, 1.8166154623031616, 1.908006191253662, 1.9993970394134521, 2.090787887573242, 2.1821787357330322, 2.2735695838928223, 2.3649604320526123, 2.4563512802124023, 2.5477418899536133, 2.6391327381134033, 2.7305235862731934, 2.8219144344329834]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 14.0, 18.0, 15.0, 25.0, 38.0, 78.0, 88.0, 128.0, 235.0, 411.0, 894.0, 2292.0, 6879.0, 35716.0, 1520181.0, 2576214.0, 39744.0, 7089.0, 2156.0, 921.0, 393.0, 237.0, 147.0, 102.0, 55.0, 29.0, 28.0, 21.0, 26.0, 21.0, 17.0, 9.0, 5.0, 5.0, 9.0, 4.0, 8.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.3623046875, -1.3118896484375, -1.261474609375, -1.2110595703125, -1.16064453125, -1.1102294921875, -1.059814453125, -1.0093994140625, -0.958984375, -0.9085693359375, -0.858154296875, -0.8077392578125, -0.75732421875, -0.7069091796875, -0.656494140625, -0.6060791015625, -0.5556640625, -0.5052490234375, -0.454833984375, -0.4044189453125, -0.35400390625, -0.3035888671875, -0.253173828125, -0.2027587890625, -0.15234375, -0.1019287109375, -0.051513671875, -0.0010986328125, 0.04931640625, 0.0997314453125, 0.150146484375, 0.2005615234375, 0.2509765625, 0.3013916015625, 0.351806640625, 0.4022216796875, 0.45263671875, 0.5030517578125, 0.553466796875, 0.6038818359375, 0.654296875, 0.7047119140625, 0.755126953125, 0.8055419921875, 0.85595703125, 0.9063720703125, 0.956787109375, 1.0072021484375, 1.0576171875, 1.1080322265625, 1.158447265625, 1.2088623046875, 1.25927734375, 1.3096923828125, 1.360107421875, 1.4105224609375, 1.4609375, 1.5113525390625, 1.561767578125, 1.6121826171875, 1.66259765625, 1.7130126953125, 1.763427734375, 1.8138427734375, 1.8642578125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 11.0, 11.0, 12.0, 13.0, 16.0, 26.0, 34.0, 45.0, 60.0, 63.0, 69.0, 79.0, 77.0, 77.0, 81.0, 72.0, 61.0, 32.0, 40.0, 42.0, 25.0, 21.0, 15.0, 5.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.206787109375, -0.2008342742919922, -0.19488143920898438, -0.18892860412597656, -0.18297576904296875, -0.17702293395996094, -0.17107009887695312, -0.1651172637939453, -0.1591644287109375, -0.1532115936279297, -0.14725875854492188, -0.14130592346191406, -0.13535308837890625, -0.12940025329589844, -0.12344741821289062, -0.11749458312988281, -0.111541748046875, -0.10558891296386719, -0.09963607788085938, -0.09368324279785156, -0.08773040771484375, -0.08177757263183594, -0.07582473754882812, -0.06987190246582031, -0.0639190673828125, -0.05796623229980469, -0.052013397216796875, -0.04606056213378906, -0.04010772705078125, -0.03415489196777344, -0.028202056884765625, -0.022249221801757812, -0.01629638671875, -0.010343551635742188, -0.004390716552734375, 0.0015621185302734375, 0.00751495361328125, 0.013467788696289062, 0.019420623779296875, 0.025373458862304688, 0.0313262939453125, 0.03727912902832031, 0.043231964111328125, 0.04918479919433594, 0.05513763427734375, 0.06109046936035156, 0.06704330444335938, 0.07299613952636719, 0.078948974609375, 0.08490180969238281, 0.09085464477539062, 0.09680747985839844, 0.10276031494140625, 0.10871315002441406, 0.11466598510742188, 0.12061882019042969, 0.1265716552734375, 0.1325244903564453, 0.13847732543945312, 0.14443016052246094, 0.15038299560546875, 0.15633583068847656, 0.16228866577148438, 0.1682415008544922, 0.1741943359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 15.0, 19.0, 29.0, 47.0, 60.0, 94.0, 141.0, 219.0, 410.0, 790.0, 1706.0, 4411.0, 13292.0, 53741.0, 480828.0, 3385990.0, 205006.0, 32497.0, 8986.0, 3174.0, 1344.0, 606.0, 332.0, 192.0, 131.0, 69.0, 41.0, 26.0, 28.0, 15.0, 8.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.99951171875, -0.9695358276367188, -0.9395599365234375, -0.9095840454101562, -0.879608154296875, -0.8496322631835938, -0.8196563720703125, -0.7896804809570312, -0.75970458984375, -0.7297286987304688, -0.6997528076171875, -0.6697769165039062, -0.639801025390625, -0.6098251342773438, -0.5798492431640625, -0.5498733520507812, -0.5198974609375, -0.48992156982421875, -0.4599456787109375, -0.42996978759765625, -0.399993896484375, -0.37001800537109375, -0.3400421142578125, -0.31006622314453125, -0.28009033203125, -0.25011444091796875, -0.2201385498046875, -0.19016265869140625, -0.160186767578125, -0.13021087646484375, -0.1002349853515625, -0.07025909423828125, -0.040283203125, -0.01030731201171875, 0.0196685791015625, 0.04964447021484375, 0.079620361328125, 0.10959625244140625, 0.1395721435546875, 0.16954803466796875, 0.19952392578125, 0.22949981689453125, 0.2594757080078125, 0.28945159912109375, 0.319427490234375, 0.34940338134765625, 0.3793792724609375, 0.40935516357421875, 0.4393310546875, 0.46930694580078125, 0.4992828369140625, 0.5292587280273438, 0.559234619140625, 0.5892105102539062, 0.6191864013671875, 0.6491622924804688, 0.67913818359375, 0.7091140747070312, 0.7390899658203125, 0.7690658569335938, 0.799041748046875, 0.8290176391601562, 0.8589935302734375, 0.8889694213867188, 0.9189453125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 9.0, 8.0, 3.0, 11.0, 11.0, 23.0, 23.0, 45.0, 56.0, 107.0, 195.0, 423.0, 1112.0, 1133.0, 436.0, 204.0, 112.0, 53.0, 38.0, 23.0, 14.0, 15.0, 7.0, 1.0, 1.0, 5.0, 7.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43408203125, -0.4213218688964844, -0.40856170654296875, -0.3958015441894531, -0.3830413818359375, -0.3702812194824219, -0.35752105712890625, -0.3447608947753906, -0.332000732421875, -0.3192405700683594, -0.30648040771484375, -0.2937202453613281, -0.2809600830078125, -0.2681999206542969, -0.25543975830078125, -0.24267959594726562, -0.22991943359375, -0.21715927124023438, -0.20439910888671875, -0.19163894653320312, -0.1788787841796875, -0.16611862182617188, -0.15335845947265625, -0.14059829711914062, -0.127838134765625, -0.11507797241210938, -0.10231781005859375, -0.08955764770507812, -0.0767974853515625, -0.06403732299804688, -0.05127716064453125, -0.038516998291015625, -0.0257568359375, -0.012996673583984375, -0.00023651123046875, 0.012523651123046875, 0.0252838134765625, 0.038043975830078125, 0.05080413818359375, 0.06356430053710938, 0.076324462890625, 0.08908462524414062, 0.10184478759765625, 0.11460494995117188, 0.1273651123046875, 0.14012527465820312, 0.15288543701171875, 0.16564559936523438, 0.17840576171875, 0.19116592407226562, 0.20392608642578125, 0.21668624877929688, 0.2294464111328125, 0.24220657348632812, 0.25496673583984375, 0.2677268981933594, 0.280487060546875, 0.2932472229003906, 0.30600738525390625, 0.3187675476074219, 0.3315277099609375, 0.3442878723144531, 0.35704803466796875, 0.3698081970214844, 0.382568359375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 9.0, 18.0, 41.0, 78.0, 128.0, 177.0, 191.0, 153.0, 99.0, 52.0, 24.0, 12.0, 8.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.024954795837402, -3.914379358291626, -3.8038036823272705, -3.693228244781494, -3.5826528072357178, -3.4720771312713623, -3.361501693725586, -3.2509260177612305, -3.140350580215454, -3.0297751426696777, -2.9191994667053223, -2.808624029159546, -2.6980485916137695, -2.587472915649414, -2.4768974781036377, -2.3663220405578613, -2.255746364593506, -2.1451709270477295, -2.034595251083374, -1.9240198135375977, -1.8134442567825317, -1.7028687000274658, -1.5922932624816895, -1.4817177057266235, -1.3711423873901367, -1.2605668306350708, -1.1499913930892944, -1.0394158363342285, -0.9288402795791626, -0.8182647824287415, -0.7076892852783203, -0.5971137285232544, -0.4865381717681885, -0.37596264481544495, -0.2653871178627014, -0.15481162071228027, -0.04423609375953674, 0.06633943319320679, 0.17691493034362793, 0.28749048709869385, 0.398065984249115, 0.5086414813995361, 0.619217038154602, 0.7297925353050232, 0.8403680324554443, 0.9509435892105103, 1.0615191459655762, 1.1720945835113525, 1.2826701402664185, 1.3932456970214844, 1.5038211345672607, 1.6143966913223267, 1.7249722480773926, 1.835547685623169, 1.9461232423782349, 2.056698799133301, 2.167274236679077, 2.2778496742248535, 2.388425350189209, 2.4990007877349854, 2.6095762252807617, 2.720151901245117, 2.8307273387908936, 2.94130277633667, 3.0518784523010254]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 6.0, 5.0, 14.0, 9.0, 22.0, 28.0, 30.0, 35.0, 39.0, 43.0, 53.0, 56.0, 48.0, 63.0, 59.0, 63.0, 55.0, 62.0, 60.0, 51.0, 42.0, 40.0, 33.0, 19.0, 18.0, 20.0, 11.0, 7.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0796396732330322, -1.031628131866455, -0.9836165904998779, -0.9356050491333008, -0.8875934481620789, -0.8395819067955017, -0.7915703654289246, -0.7435587644577026, -0.6955472230911255, -0.6475356817245483, -0.5995241403579712, -0.551512598991394, -0.5035009980201721, -0.45548945665359497, -0.4074779152870178, -0.3594663441181183, -0.3114548325538635, -0.2634432911872864, -0.21543172001838684, -0.1674201786518097, -0.11940862238407135, -0.07139706611633301, -0.02338552474975586, 0.024626046419143677, 0.07263758778572083, 0.12064914405345917, 0.1686607003211975, 0.21667224168777466, 0.2646837830543518, 0.31269535422325134, 0.3607068955898285, 0.408718466758728, 0.4567300081253052, 0.5047415494918823, 0.5527530908584595, 0.6007646322250366, 0.6487762331962585, 0.6967877745628357, 0.7447993159294128, 0.7928109169006348, 0.8408224582672119, 0.8888339996337891, 0.9368455410003662, 0.9848570823669434, 1.0328686237335205, 1.0808801651000977, 1.1288917064666748, 1.1769033670425415, 1.224914789199829, 1.2729263305664062, 1.3209378719329834, 1.3689494132995605, 1.4169609546661377, 1.4649724960327148, 1.512984037399292, 1.5609956979751587, 1.6090072393417358, 1.657018780708313, 1.7050303220748901, 1.7530418634414673, 1.8010534048080444, 1.8490650653839111, 1.8970766067504883, 1.9450881481170654, 1.9930996894836426]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 6.0, 6.0, 14.0, 21.0, 30.0, 81.0, 171.0, 351.0, 895.0, 3978.0, 42085.0, 829365.0, 160761.0, 8287.0, 1573.0, 490.0, 177.0, 105.0, 58.0, 26.0, 25.0, 11.0, 9.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09375, -3.0137939453125, -2.933837890625, -2.8538818359375, -2.77392578125, -2.6939697265625, -2.614013671875, -2.5340576171875, -2.4541015625, -2.3741455078125, -2.294189453125, -2.2142333984375, -2.13427734375, -2.0543212890625, -1.974365234375, -1.8944091796875, -1.814453125, -1.7344970703125, -1.654541015625, -1.5745849609375, -1.49462890625, -1.4146728515625, -1.334716796875, -1.2547607421875, -1.1748046875, -1.0948486328125, -1.014892578125, -0.9349365234375, -0.85498046875, -0.7750244140625, -0.695068359375, -0.6151123046875, -0.53515625, -0.4552001953125, -0.375244140625, -0.2952880859375, -0.21533203125, -0.1353759765625, -0.055419921875, 0.0245361328125, 0.1044921875, 0.1844482421875, 0.264404296875, 0.3443603515625, 0.42431640625, 0.5042724609375, 0.584228515625, 0.6641845703125, 0.744140625, 0.8240966796875, 0.904052734375, 0.9840087890625, 1.06396484375, 1.1439208984375, 1.223876953125, 1.3038330078125, 1.3837890625, 1.4637451171875, 1.543701171875, 1.6236572265625, 1.70361328125, 1.7835693359375, 1.863525390625, 1.9434814453125, 2.0234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 4.0, 12.0, 9.0, 9.0, 18.0, 21.0, 29.0, 36.0, 45.0, 43.0, 50.0, 58.0, 64.0, 76.0, 58.0, 66.0, 52.0, 63.0, 49.0, 43.0, 43.0, 34.0, 16.0, 23.0, 23.0, 15.0, 13.0, 10.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.151611328125, -0.14647293090820312, -0.14133453369140625, -0.13619613647460938, -0.1310577392578125, -0.12591934204101562, -0.12078094482421875, -0.11564254760742188, -0.110504150390625, -0.10536575317382812, -0.10022735595703125, -0.09508895874023438, -0.0899505615234375, -0.08481216430664062, -0.07967376708984375, -0.07453536987304688, -0.06939697265625, -0.06425857543945312, -0.05912017822265625, -0.053981781005859375, -0.0488433837890625, -0.043704986572265625, -0.03856658935546875, -0.033428192138671875, -0.028289794921875, -0.023151397705078125, -0.01801300048828125, -0.012874603271484375, -0.0077362060546875, -0.002597808837890625, 0.00254058837890625, 0.007678985595703125, 0.0128173828125, 0.017955780029296875, 0.02309417724609375, 0.028232574462890625, 0.0333709716796875, 0.038509368896484375, 0.04364776611328125, 0.048786163330078125, 0.053924560546875, 0.059062957763671875, 0.06420135498046875, 0.06933975219726562, 0.0744781494140625, 0.07961654663085938, 0.08475494384765625, 0.08989334106445312, 0.09503173828125, 0.10017013549804688, 0.10530853271484375, 0.11044692993164062, 0.1155853271484375, 0.12072372436523438, 0.12586212158203125, 0.13100051879882812, 0.136138916015625, 0.14127731323242188, 0.14641571044921875, 0.15155410766601562, 0.1566925048828125, 0.16183090209960938, 0.16696929931640625, 0.17210769653320312, 0.17724609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 4.0, 10.0, 7.0, 11.0, 17.0, 18.0, 37.0, 40.0, 56.0, 85.0, 106.0, 152.0, 269.0, 380.0, 622.0, 1118.0, 2135.0, 4391.0, 10197.0, 25462.0, 68735.0, 192506.0, 377285.0, 229317.0, 82264.0, 30556.0, 11846.0, 5099.0, 2536.0, 1281.0, 721.0, 399.0, 265.0, 163.0, 124.0, 92.0, 64.0, 50.0, 38.0, 29.0, 19.0, 16.0, 11.0, 2.0, 7.0, 10.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4580078125, -0.4407806396484375, -0.423553466796875, -0.4063262939453125, -0.38909912109375, -0.3718719482421875, -0.354644775390625, -0.3374176025390625, -0.3201904296875, -0.3029632568359375, -0.285736083984375, -0.2685089111328125, -0.25128173828125, -0.2340545654296875, -0.216827392578125, -0.1996002197265625, -0.182373046875, -0.1651458740234375, -0.147918701171875, -0.1306915283203125, -0.11346435546875, -0.0962371826171875, -0.079010009765625, -0.0617828369140625, -0.0445556640625, -0.0273284912109375, -0.010101318359375, 0.0071258544921875, 0.02435302734375, 0.0415802001953125, 0.058807373046875, 0.0760345458984375, 0.09326171875, 0.1104888916015625, 0.127716064453125, 0.1449432373046875, 0.16217041015625, 0.1793975830078125, 0.196624755859375, 0.2138519287109375, 0.2310791015625, 0.2483062744140625, 0.265533447265625, 0.2827606201171875, 0.29998779296875, 0.3172149658203125, 0.334442138671875, 0.3516693115234375, 0.368896484375, 0.3861236572265625, 0.403350830078125, 0.4205780029296875, 0.43780517578125, 0.4550323486328125, 0.472259521484375, 0.4894866943359375, 0.5067138671875, 0.5239410400390625, 0.541168212890625, 0.5583953857421875, 0.57562255859375, 0.5928497314453125, 0.610076904296875, 0.6273040771484375, 0.64453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 3.0, 5.0, 7.0, 8.0, 10.0, 12.0, 14.0, 13.0, 18.0, 22.0, 30.0, 23.0, 32.0, 36.0, 40.0, 43.0, 41.0, 44.0, 56.0, 49.0, 42.0, 39.0, 45.0, 50.0, 44.0, 34.0, 29.0, 33.0, 29.0, 21.0, 19.0, 17.0, 14.0, 10.0, 10.0, 13.0, 15.0, 6.0, 5.0, 4.0, 2.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.552734375, -0.5361099243164062, -0.5194854736328125, -0.5028610229492188, -0.486236572265625, -0.46961212158203125, -0.4529876708984375, -0.43636322021484375, -0.41973876953125, -0.40311431884765625, -0.3864898681640625, -0.36986541748046875, -0.353240966796875, -0.33661651611328125, -0.3199920654296875, -0.30336761474609375, -0.2867431640625, -0.27011871337890625, -0.2534942626953125, -0.23686981201171875, -0.220245361328125, -0.20362091064453125, -0.1869964599609375, -0.17037200927734375, -0.15374755859375, -0.13712310791015625, -0.1204986572265625, -0.10387420654296875, -0.087249755859375, -0.07062530517578125, -0.0540008544921875, -0.03737640380859375, -0.020751953125, -0.00412750244140625, 0.0124969482421875, 0.02912139892578125, 0.045745849609375, 0.06237030029296875, 0.0789947509765625, 0.09561920166015625, 0.11224365234375, 0.12886810302734375, 0.1454925537109375, 0.16211700439453125, 0.178741455078125, 0.19536590576171875, 0.2119903564453125, 0.22861480712890625, 0.2452392578125, 0.26186370849609375, 0.2784881591796875, 0.29511260986328125, 0.311737060546875, 0.32836151123046875, 0.3449859619140625, 0.36161041259765625, 0.37823486328125, 0.39485931396484375, 0.4114837646484375, 0.42810821533203125, 0.444732666015625, 0.46135711669921875, 0.4779815673828125, 0.49460601806640625, 0.51123046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 9.0, 13.0, 36.0, 40.0, 75.0, 248.0, 613.0, 2343.0, 17963.0, 639095.0, 373130.0, 12323.0, 1843.0, 462.0, 192.0, 76.0, 43.0, 22.0, 7.0, 9.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7822265625, -0.7508392333984375, -0.719451904296875, -0.6880645751953125, -0.65667724609375, -0.6252899169921875, -0.593902587890625, -0.5625152587890625, -0.5311279296875, -0.4997406005859375, -0.468353271484375, -0.4369659423828125, -0.40557861328125, -0.3741912841796875, -0.342803955078125, -0.3114166259765625, -0.280029296875, -0.2486419677734375, -0.217254638671875, -0.1858673095703125, -0.15447998046875, -0.1230926513671875, -0.091705322265625, -0.0603179931640625, -0.0289306640625, 0.0024566650390625, 0.033843994140625, 0.0652313232421875, 0.09661865234375, 0.1280059814453125, 0.159393310546875, 0.1907806396484375, 0.22216796875, 0.2535552978515625, 0.284942626953125, 0.3163299560546875, 0.34771728515625, 0.3791046142578125, 0.410491943359375, 0.4418792724609375, 0.4732666015625, 0.5046539306640625, 0.536041259765625, 0.5674285888671875, 0.59881591796875, 0.6302032470703125, 0.661590576171875, 0.6929779052734375, 0.724365234375, 0.7557525634765625, 0.787139892578125, 0.8185272216796875, 0.84991455078125, 0.8813018798828125, 0.912689208984375, 0.9440765380859375, 0.9754638671875, 1.0068511962890625, 1.038238525390625, 1.0696258544921875, 1.10101318359375, 1.1324005126953125, 1.163787841796875, 1.1951751708984375, 1.2265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 8.0, 7.0, 7.0, 18.0, 12.0, 22.0, 29.0, 40.0, 65.0, 69.0, 103.0, 119.0, 136.0, 114.0, 75.0, 56.0, 37.0, 22.0, 17.0, 9.0, 12.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010758638381958008, -0.00010449253022670746, -0.00010139867663383484, -9.830482304096222e-05, -9.52109694480896e-05, -9.211711585521698e-05, -8.902326226234436e-05, -8.592940866947174e-05, -8.283555507659912e-05, -7.97417014837265e-05, -7.664784789085388e-05, -7.355399429798126e-05, -7.046014070510864e-05, -6.736628711223602e-05, -6.42724335193634e-05, -6.117857992649078e-05, -5.8084726333618164e-05, -5.4990872740745544e-05, -5.1897019147872925e-05, -4.8803165555000305e-05, -4.5709311962127686e-05, -4.2615458369255066e-05, -3.9521604776382446e-05, -3.642775118350983e-05, -3.333389759063721e-05, -3.0240043997764587e-05, -2.7146190404891968e-05, -2.4052336812019348e-05, -2.095848321914673e-05, -1.786462962627411e-05, -1.477077603340149e-05, -1.167692244052887e-05, -8.58306884765625e-06, -5.48921525478363e-06, -2.3953616619110107e-06, 6.984919309616089e-07, 3.7923455238342285e-06, 6.886199116706848e-06, 9.980052709579468e-06, 1.3073906302452087e-05, 1.6167759895324707e-05, 1.9261613488197327e-05, 2.2355467081069946e-05, 2.5449320673942566e-05, 2.8543174266815186e-05, 3.1637027859687805e-05, 3.4730881452560425e-05, 3.7824735045433044e-05, 4.0918588638305664e-05, 4.4012442231178284e-05, 4.71062958240509e-05, 5.020014941692352e-05, 5.329400300979614e-05, 5.638785660266876e-05, 5.948171019554138e-05, 6.2575563788414e-05, 6.566941738128662e-05, 6.876327097415924e-05, 7.185712456703186e-05, 7.495097815990448e-05, 7.80448317527771e-05, 8.113868534564972e-05, 8.423253893852234e-05, 8.732639253139496e-05, 9.042024612426758e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 10.0, 20.0, 47.0, 87.0, 188.0, 568.0, 3607.0, 134377.0, 898353.0, 9863.0, 959.0, 272.0, 102.0, 58.0, 17.0, 18.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.39453125, -1.341278076171875, -1.28802490234375, -1.234771728515625, -1.1815185546875, -1.128265380859375, -1.07501220703125, -1.021759033203125, -0.968505859375, -0.915252685546875, -0.86199951171875, -0.808746337890625, -0.7554931640625, -0.702239990234375, -0.64898681640625, -0.595733642578125, -0.54248046875, -0.489227294921875, -0.43597412109375, -0.382720947265625, -0.3294677734375, -0.276214599609375, -0.22296142578125, -0.169708251953125, -0.116455078125, -0.063201904296875, -0.00994873046875, 0.043304443359375, 0.0965576171875, 0.149810791015625, 0.20306396484375, 0.256317138671875, 0.3095703125, 0.362823486328125, 0.41607666015625, 0.469329833984375, 0.5225830078125, 0.575836181640625, 0.62908935546875, 0.682342529296875, 0.735595703125, 0.788848876953125, 0.84210205078125, 0.895355224609375, 0.9486083984375, 1.001861572265625, 1.05511474609375, 1.108367919921875, 1.16162109375, 1.214874267578125, 1.26812744140625, 1.321380615234375, 1.3746337890625, 1.427886962890625, 1.48114013671875, 1.534393310546875, 1.587646484375, 1.640899658203125, 1.69415283203125, 1.747406005859375, 1.8006591796875, 1.853912353515625, 1.90716552734375, 1.960418701171875, 2.013671875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 12.0, 18.0, 45.0, 79.0, 174.0, 245.0, 201.0, 103.0, 46.0, 30.0, 11.0, 15.0, 4.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6845703125, -0.6588821411132812, -0.6331939697265625, -0.6075057983398438, -0.581817626953125, -0.5561294555664062, -0.5304412841796875, -0.5047531127929688, -0.47906494140625, -0.45337677001953125, -0.4276885986328125, -0.40200042724609375, -0.376312255859375, -0.35062408447265625, -0.3249359130859375, -0.29924774169921875, -0.2735595703125, -0.24787139892578125, -0.2221832275390625, -0.19649505615234375, -0.170806884765625, -0.14511871337890625, -0.1194305419921875, -0.09374237060546875, -0.06805419921875, -0.04236602783203125, -0.0166778564453125, 0.00901031494140625, 0.034698486328125, 0.06038665771484375, 0.0860748291015625, 0.11176300048828125, 0.137451171875, 0.16313934326171875, 0.1888275146484375, 0.21451568603515625, 0.240203857421875, 0.26589202880859375, 0.2915802001953125, 0.31726837158203125, 0.34295654296875, 0.36864471435546875, 0.3943328857421875, 0.42002105712890625, 0.445709228515625, 0.47139739990234375, 0.4970855712890625, 0.5227737426757812, 0.5484619140625, 0.5741500854492188, 0.5998382568359375, 0.6255264282226562, 0.651214599609375, 0.6769027709960938, 0.7025909423828125, 0.7282791137695312, 0.75396728515625, 0.7796554565429688, 0.8053436279296875, 0.8310317993164062, 0.856719970703125, 0.8824081420898438, 0.9080963134765625, 0.9337844848632812, 0.95947265625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 23.0, 65.0, 132.0, 273.0, 232.0, 162.0, 70.0, 28.0, 12.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.694255828857422, -16.331281661987305, -15.968308448791504, -15.605334281921387, -15.24236011505127, -14.879386901855469, -14.516412734985352, -14.153438568115234, -13.790464401245117, -13.427490234375, -13.0645170211792, -12.701542854309082, -12.338568687438965, -11.975595474243164, -11.612621307373047, -11.24964714050293, -10.886673927307129, -10.523699760437012, -10.160726547241211, -9.797752380371094, -9.434778213500977, -9.07180404663086, -8.708830833435059, -8.345856666564941, -7.982882976531982, -7.619909286499023, -7.256935119628906, -6.893961429595947, -6.530987739562988, -6.168013572692871, -5.805039882659912, -5.442066192626953, -5.079092025756836, -4.716118335723877, -4.35314416885376, -3.990170478820801, -3.6271965503692627, -3.2642226219177246, -2.9012489318847656, -2.5382750034332275, -2.1753010749816895, -1.8123271465301514, -1.4493533372879028, -1.0863795280456543, -0.7234055995941162, -0.3604316711425781, 0.0025420188903808594, 0.36551594734191895, 0.728489875793457, 1.0914638042449951, 1.4544376134872437, 1.8174114227294922, 2.1803853511810303, 2.5433592796325684, 2.9063329696655273, 3.2693068981170654, 3.6322808265686035, 3.9952547550201416, 4.35822868347168, 4.721202373504639, 5.084176063537598, 5.447150230407715, 5.810123920440674, 6.173097610473633, 6.53607177734375]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 4.0, 3.0, 3.0, 10.0, 5.0, 7.0, 4.0, 11.0, 8.0, 24.0, 16.0, 25.0, 29.0, 36.0, 37.0, 21.0, 25.0, 37.0, 38.0, 44.0, 49.0, 46.0, 49.0, 47.0, 56.0, 45.0, 38.0, 42.0, 25.0, 34.0, 23.0, 23.0, 19.0, 22.0, 14.0, 17.0, 11.0, 13.0, 7.0, 9.0, 5.0, 5.0, 2.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.9814746379852295, -2.891805648803711, -2.8021366596221924, -2.712467670440674, -2.622798442840576, -2.5331294536590576, -2.443460464477539, -2.3537914752960205, -2.264122486114502, -2.1744534969329834, -2.084784507751465, -1.9951153993606567, -1.9054462909698486, -1.81577730178833, -1.7261083126068115, -1.636439323425293, -1.5467700958251953, -1.4571011066436768, -1.3674319982528687, -1.27776300907135, -1.188093900680542, -1.0984249114990234, -1.0087559223175049, -0.9190868735313416, -0.8294178247451782, -0.7397487759590149, -0.6500797271728516, -0.560410737991333, -0.4707416892051697, -0.38107264041900635, -0.2914036512374878, -0.20173460245132446, -0.11206579208374023, -0.022396758198738098, 0.06727227568626404, 0.15694129467010498, 0.2466103434562683, 0.33627939224243164, 0.4259483814239502, 0.5156174302101135, 0.6052864789962769, 0.6949555277824402, 0.7846245765686035, 0.8742935657501221, 0.9639626145362854, 1.0536316633224487, 1.1433006525039673, 1.2329697608947754, 1.322638750076294, 1.4123077392578125, 1.5019768476486206, 1.5916458368301392, 1.6813149452209473, 1.7709839344024658, 1.8606529235839844, 1.950321912765503, 2.0399909019470215, 2.12965989112854, 2.2193288803100586, 2.3089981079101562, 2.398667097091675, 2.4883360862731934, 2.578005075454712, 2.6676740646362305, 2.757343292236328]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 7.0, 8.0, 8.0, 24.0, 32.0, 35.0, 63.0, 140.0, 273.0, 783.0, 2825.0, 20971.0, 3849465.0, 307218.0, 9800.0, 1639.0, 499.0, 198.0, 111.0, 49.0, 42.0, 24.0, 16.0, 16.0, 7.0, 12.0, 2.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.94512939453125, -1.8668212890625, -1.78851318359375, -1.710205078125, -1.63189697265625, -1.5535888671875, -1.47528076171875, -1.39697265625, -1.31866455078125, -1.2403564453125, -1.16204833984375, -1.083740234375, -1.00543212890625, -0.9271240234375, -0.84881591796875, -0.7705078125, -0.69219970703125, -0.6138916015625, -0.53558349609375, -0.457275390625, -0.37896728515625, -0.3006591796875, -0.22235107421875, -0.14404296875, -0.06573486328125, 0.0125732421875, 0.09088134765625, 0.169189453125, 0.24749755859375, 0.3258056640625, 0.40411376953125, 0.482421875, 0.56072998046875, 0.6390380859375, 0.71734619140625, 0.795654296875, 0.87396240234375, 0.9522705078125, 1.03057861328125, 1.10888671875, 1.18719482421875, 1.2655029296875, 1.34381103515625, 1.422119140625, 1.50042724609375, 1.5787353515625, 1.65704345703125, 1.7353515625, 1.81365966796875, 1.8919677734375, 1.97027587890625, 2.048583984375, 2.12689208984375, 2.2052001953125, 2.28350830078125, 2.36181640625, 2.44012451171875, 2.5184326171875, 2.59674072265625, 2.675048828125, 2.75335693359375, 2.8316650390625, 2.90997314453125, 2.98828125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 11.0, 9.0, 19.0, 16.0, 18.0, 35.0, 29.0, 40.0, 39.0, 58.0, 47.0, 66.0, 55.0, 58.0, 73.0, 74.0, 56.0, 47.0, 48.0, 41.0, 33.0, 27.0, 15.0, 10.0, 18.0, 15.0, 7.0, 6.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154296875, -0.1488628387451172, -0.14342880249023438, -0.13799476623535156, -0.13256072998046875, -0.12712669372558594, -0.12169265747070312, -0.11625862121582031, -0.1108245849609375, -0.10539054870605469, -0.09995651245117188, -0.09452247619628906, -0.08908843994140625, -0.08365440368652344, -0.07822036743164062, -0.07278633117675781, -0.067352294921875, -0.06191825866699219, -0.056484222412109375, -0.05105018615722656, -0.04561614990234375, -0.04018211364746094, -0.034748077392578125, -0.029314041137695312, -0.0238800048828125, -0.018445968627929688, -0.013011932373046875, -0.0075778961181640625, -0.00214385986328125, 0.0032901763916015625, 0.008724212646484375, 0.014158248901367188, 0.01959228515625, 0.025026321411132812, 0.030460357666015625, 0.03589439392089844, 0.04132843017578125, 0.04676246643066406, 0.052196502685546875, 0.05763053894042969, 0.0630645751953125, 0.06849861145019531, 0.07393264770507812, 0.07936668395996094, 0.08480072021484375, 0.09023475646972656, 0.09566879272460938, 0.10110282897949219, 0.106536865234375, 0.11197090148925781, 0.11740493774414062, 0.12283897399902344, 0.12827301025390625, 0.13370704650878906, 0.13914108276367188, 0.1445751190185547, 0.1500091552734375, 0.1554431915283203, 0.16087722778320312, 0.16631126403808594, 0.17174530029296875, 0.17717933654785156, 0.18261337280273438, 0.1880474090576172, 0.1934814453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 10.0, 11.0, 9.0, 10.0, 15.0, 32.0, 41.0, 50.0, 61.0, 85.0, 101.0, 206.0, 445.0, 1094.0, 4926.0, 51678.0, 3974024.0, 149846.0, 8785.0, 1690.0, 541.0, 225.0, 113.0, 71.0, 52.0, 52.0, 30.0, 29.0, 8.0, 15.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.890625, -1.819671630859375, -1.74871826171875, -1.677764892578125, -1.6068115234375, -1.535858154296875, -1.46490478515625, -1.393951416015625, -1.322998046875, -1.252044677734375, -1.18109130859375, -1.110137939453125, -1.0391845703125, -0.968231201171875, -0.89727783203125, -0.826324462890625, -0.75537109375, -0.684417724609375, -0.61346435546875, -0.542510986328125, -0.4715576171875, -0.400604248046875, -0.32965087890625, -0.258697509765625, -0.187744140625, -0.116790771484375, -0.04583740234375, 0.025115966796875, 0.0960693359375, 0.167022705078125, 0.23797607421875, 0.308929443359375, 0.3798828125, 0.450836181640625, 0.52178955078125, 0.592742919921875, 0.6636962890625, 0.734649658203125, 0.80560302734375, 0.876556396484375, 0.947509765625, 1.018463134765625, 1.08941650390625, 1.160369873046875, 1.2313232421875, 1.302276611328125, 1.37322998046875, 1.444183349609375, 1.51513671875, 1.586090087890625, 1.65704345703125, 1.727996826171875, 1.7989501953125, 1.869903564453125, 1.94085693359375, 2.011810302734375, 2.082763671875, 2.153717041015625, 2.22467041015625, 2.295623779296875, 2.3665771484375, 2.437530517578125, 2.50848388671875, 2.579437255859375, 2.650390625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 6.0, 8.0, 15.0, 20.0, 46.0, 85.0, 240.0, 1028.0, 2074.0, 331.0, 126.0, 46.0, 16.0, 15.0, 10.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-1.0322265625, -1.0120468139648438, -0.9918670654296875, -0.9716873168945312, -0.951507568359375, -0.9313278198242188, -0.9111480712890625, -0.8909683227539062, -0.87078857421875, -0.8506088256835938, -0.8304290771484375, -0.8102493286132812, -0.790069580078125, -0.7698898315429688, -0.7497100830078125, -0.7295303344726562, -0.7093505859375, -0.6891708374023438, -0.6689910888671875, -0.6488113403320312, -0.628631591796875, -0.6084518432617188, -0.5882720947265625, -0.5680923461914062, -0.54791259765625, -0.5277328491210938, -0.5075531005859375, -0.48737335205078125, -0.467193603515625, -0.44701385498046875, -0.4268341064453125, -0.40665435791015625, -0.386474609375, -0.36629486083984375, -0.3461151123046875, -0.32593536376953125, -0.305755615234375, -0.28557586669921875, -0.2653961181640625, -0.24521636962890625, -0.22503662109375, -0.20485687255859375, -0.1846771240234375, -0.16449737548828125, -0.144317626953125, -0.12413787841796875, -0.1039581298828125, -0.08377838134765625, -0.0635986328125, -0.04341888427734375, -0.0232391357421875, -0.00305938720703125, 0.017120361328125, 0.03730010986328125, 0.0574798583984375, 0.07765960693359375, 0.09783935546875, 0.11801910400390625, 0.1381988525390625, 0.15837860107421875, 0.178558349609375, 0.19873809814453125, 0.2189178466796875, 0.23909759521484375, 0.25927734375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 9.0, 6.0, 33.0, 134.0, 343.0, 276.0, 133.0, 36.0, 11.0, 6.0, 2.0, 7.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.465598106384277, -9.280097007751465, -9.094595909118652, -8.90909481048584, -8.723592758178711, -8.538091659545898, -8.352590560913086, -8.167089462280273, -7.981588363647461, -7.796087265014648, -7.610585689544678, -7.425084590911865, -7.239583492279053, -7.05408239364624, -6.8685808181762695, -6.683079719543457, -6.4975786209106445, -6.312077522277832, -6.126575946807861, -5.941074848175049, -5.755573749542236, -5.570072650909424, -5.384571075439453, -5.199069976806641, -5.01356840133667, -4.828067302703857, -4.642565727233887, -4.457064628601074, -4.271563529968262, -4.086062431335449, -3.9005608558654785, -3.715059757232666, -3.5295586585998535, -3.344057321548462, -3.1585562229156494, -2.973054885864258, -2.7875537872314453, -2.6020524501800537, -2.416551113128662, -2.2310500144958496, -2.045548915863037, -1.860047698020935, -1.674546480178833, -1.4890451431274414, -1.303544044494629, -1.1180427074432373, -0.9325414896011353, -0.7470402717590332, -0.5615389347076416, -0.37603771686553955, -0.1905364692211151, -0.005035221576690674, 0.18046599626541138, 0.3659672141075134, 0.5514684915542603, 0.7369697093963623, 0.9224709272384644, 1.1079721450805664, 1.2934733629226685, 1.4789745807647705, 1.664475917816162, 1.8499770164489746, 2.035478353500366, 2.220979690551758, 2.4064807891845703]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 9.0, 16.0, 18.0, 21.0, 35.0, 53.0, 57.0, 67.0, 68.0, 68.0, 89.0, 81.0, 76.0, 68.0, 71.0, 60.0, 41.0, 28.0, 29.0, 19.0, 11.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3186640739440918, -1.2607791423797607, -1.2028943300247192, -1.1450093984603882, -1.0871244668960571, -1.0292396545410156, -0.9713547229766846, -0.9134698510169983, -0.855584979057312, -0.7977001070976257, -0.7398151755332947, -0.6819303035736084, -0.6240454316139221, -0.5661605596542358, -0.5082756280899048, -0.4503907561302185, -0.39250582456588745, -0.3346209228038788, -0.2767360508441925, -0.21885114908218384, -0.16096626222133636, -0.10308137536048889, -0.045196473598480225, 0.012688398361206055, 0.07057330012321472, 0.1284581869840622, 0.18634307384490967, 0.24422797560691833, 0.302112877368927, 0.3599977493286133, 0.41788265109062195, 0.4757675230503082, 0.5336524248123169, 0.5915372967720032, 0.6494222283363342, 0.7073071002960205, 0.7651919722557068, 0.8230768442153931, 0.8809617757797241, 0.9388466477394104, 0.9967315196990967, 1.0546164512634277, 1.1125012636184692, 1.1703861951828003, 1.2282711267471313, 1.2861559391021729, 1.344040870666504, 1.401925802230835, 1.459810733795166, 1.517695665359497, 1.5755804777145386, 1.6334654092788696, 1.6913503408432007, 1.7492351531982422, 1.8071200847625732, 1.8650050163269043, 1.9228898286819458, 1.9807747602462769, 2.0386595726013184, 2.0965445041656494, 2.1544294357299805, 2.2123143672943115, 2.2701992988586426, 2.3280839920043945, 2.3859689235687256]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 6.0, 4.0, 9.0, 14.0, 21.0, 30.0, 36.0, 78.0, 172.0, 402.0, 1243.0, 6591.0, 100170.0, 840674.0, 90955.0, 6122.0, 1235.0, 435.0, 156.0, 75.0, 45.0, 39.0, 23.0, 6.0, 5.0, 6.0, 0.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9140625, -1.838958740234375, -1.76385498046875, -1.688751220703125, -1.6136474609375, -1.538543701171875, -1.46343994140625, -1.388336181640625, -1.313232421875, -1.238128662109375, -1.16302490234375, -1.087921142578125, -1.0128173828125, -0.937713623046875, -0.86260986328125, -0.787506103515625, -0.71240234375, -0.637298583984375, -0.56219482421875, -0.487091064453125, -0.4119873046875, -0.336883544921875, -0.26177978515625, -0.186676025390625, -0.111572265625, -0.036468505859375, 0.03863525390625, 0.113739013671875, 0.1888427734375, 0.263946533203125, 0.33905029296875, 0.414154052734375, 0.4892578125, 0.564361572265625, 0.63946533203125, 0.714569091796875, 0.7896728515625, 0.864776611328125, 0.93988037109375, 1.014984130859375, 1.090087890625, 1.165191650390625, 1.24029541015625, 1.315399169921875, 1.3905029296875, 1.465606689453125, 1.54071044921875, 1.615814208984375, 1.69091796875, 1.766021728515625, 1.84112548828125, 1.916229248046875, 1.9913330078125, 2.066436767578125, 2.14154052734375, 2.216644287109375, 2.291748046875, 2.366851806640625, 2.44195556640625, 2.517059326171875, 2.5921630859375, 2.667266845703125, 2.74237060546875, 2.817474365234375, 2.892578125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 10.0, 15.0, 14.0, 11.0, 23.0, 25.0, 24.0, 34.0, 36.0, 39.0, 49.0, 42.0, 69.0, 61.0, 63.0, 59.0, 60.0, 60.0, 37.0, 47.0, 38.0, 49.0, 33.0, 17.0, 21.0, 12.0, 13.0, 9.0, 13.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1739501953125, -0.1684246063232422, -0.16289901733398438, -0.15737342834472656, -0.15184783935546875, -0.14632225036621094, -0.14079666137695312, -0.1352710723876953, -0.1297454833984375, -0.12421989440917969, -0.11869430541992188, -0.11316871643066406, -0.10764312744140625, -0.10211753845214844, -0.09659194946289062, -0.09106636047363281, -0.085540771484375, -0.08001518249511719, -0.07448959350585938, -0.06896400451660156, -0.06343841552734375, -0.05791282653808594, -0.052387237548828125, -0.04686164855957031, -0.0413360595703125, -0.03581047058105469, -0.030284881591796875, -0.024759292602539062, -0.01923370361328125, -0.013708114624023438, -0.008182525634765625, -0.0026569366455078125, 0.00286865234375, 0.008394241333007812, 0.013919830322265625, 0.019445419311523438, 0.02497100830078125, 0.030496597290039062, 0.036022186279296875, 0.04154777526855469, 0.0470733642578125, 0.05259895324707031, 0.058124542236328125, 0.06365013122558594, 0.06917572021484375, 0.07470130920410156, 0.08022689819335938, 0.08575248718261719, 0.091278076171875, 0.09680366516113281, 0.10232925415039062, 0.10785484313964844, 0.11338043212890625, 0.11890602111816406, 0.12443161010742188, 0.1299571990966797, 0.1354827880859375, 0.1410083770751953, 0.14653396606445312, 0.15205955505371094, 0.15758514404296875, 0.16311073303222656, 0.16863632202148438, 0.1741619110107422, 0.1796875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 5.0, 7.0, 13.0, 16.0, 33.0, 27.0, 51.0, 92.0, 169.0, 266.0, 542.0, 1238.0, 3119.0, 8604.0, 25745.0, 82736.0, 266937.0, 423069.0, 161054.0, 49475.0, 16092.0, 5412.0, 2031.0, 818.0, 427.0, 222.0, 135.0, 75.0, 46.0, 41.0, 20.0, 10.0, 4.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.7978515625, -0.7764511108398438, -0.7550506591796875, -0.7336502075195312, -0.712249755859375, -0.6908493041992188, -0.6694488525390625, -0.6480484008789062, -0.62664794921875, -0.6052474975585938, -0.5838470458984375, -0.5624465942382812, -0.541046142578125, -0.5196456909179688, -0.4982452392578125, -0.47684478759765625, -0.4554443359375, -0.43404388427734375, -0.4126434326171875, -0.39124298095703125, -0.369842529296875, -0.34844207763671875, -0.3270416259765625, -0.30564117431640625, -0.28424072265625, -0.26284027099609375, -0.2414398193359375, -0.22003936767578125, -0.198638916015625, -0.17723846435546875, -0.1558380126953125, -0.13443756103515625, -0.113037109375, -0.09163665771484375, -0.0702362060546875, -0.04883575439453125, -0.027435302734375, -0.00603485107421875, 0.0153656005859375, 0.03676605224609375, 0.05816650390625, 0.07956695556640625, 0.1009674072265625, 0.12236785888671875, 0.143768310546875, 0.16516876220703125, 0.1865692138671875, 0.20796966552734375, 0.2293701171875, 0.25077056884765625, 0.2721710205078125, 0.29357147216796875, 0.314971923828125, 0.33637237548828125, 0.3577728271484375, 0.37917327880859375, 0.40057373046875, 0.42197418212890625, 0.4433746337890625, 0.46477508544921875, 0.486175537109375, 0.5075759887695312, 0.5289764404296875, 0.5503768920898438, 0.57177734375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 12.0, 22.0, 12.0, 13.0, 17.0, 16.0, 20.0, 25.0, 26.0, 24.0, 34.0, 38.0, 43.0, 46.0, 42.0, 40.0, 41.0, 45.0, 38.0, 44.0, 45.0, 31.0, 39.0, 24.0, 27.0, 32.0, 23.0, 27.0, 24.0, 22.0, 15.0, 13.0, 19.0, 8.0, 8.0, 5.0, 7.0, 4.0, 4.0, 9.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5068359375, -0.4906768798828125, -0.474517822265625, -0.4583587646484375, -0.44219970703125, -0.4260406494140625, -0.409881591796875, -0.3937225341796875, -0.3775634765625, -0.3614044189453125, -0.345245361328125, -0.3290863037109375, -0.31292724609375, -0.2967681884765625, -0.280609130859375, -0.2644500732421875, -0.248291015625, -0.2321319580078125, -0.215972900390625, -0.1998138427734375, -0.18365478515625, -0.1674957275390625, -0.151336669921875, -0.1351776123046875, -0.1190185546875, -0.1028594970703125, -0.086700439453125, -0.0705413818359375, -0.05438232421875, -0.0382232666015625, -0.022064208984375, -0.0059051513671875, 0.01025390625, 0.0264129638671875, 0.042572021484375, 0.0587310791015625, 0.07489013671875, 0.0910491943359375, 0.107208251953125, 0.1233673095703125, 0.1395263671875, 0.1556854248046875, 0.171844482421875, 0.1880035400390625, 0.20416259765625, 0.2203216552734375, 0.236480712890625, 0.2526397705078125, 0.268798828125, 0.2849578857421875, 0.301116943359375, 0.3172760009765625, 0.33343505859375, 0.3495941162109375, 0.365753173828125, 0.3819122314453125, 0.3980712890625, 0.4142303466796875, 0.430389404296875, 0.4465484619140625, 0.46270751953125, 0.4788665771484375, 0.495025634765625, 0.5111846923828125, 0.52734375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 12.0, 15.0, 39.0, 52.0, 81.0, 175.0, 375.0, 1071.0, 3442.0, 14639.0, 89250.0, 583425.0, 305159.0, 39949.0, 7593.0, 1955.0, 678.0, 304.0, 155.0, 60.0, 42.0, 33.0, 14.0, 3.0, 5.0, 2.0, 5.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.389892578125, -0.3753395080566406, -0.36078643798828125, -0.3462333679199219, -0.3316802978515625, -0.3171272277832031, -0.30257415771484375, -0.2880210876464844, -0.273468017578125, -0.2589149475097656, -0.24436187744140625, -0.22980880737304688, -0.2152557373046875, -0.20070266723632812, -0.18614959716796875, -0.17159652709960938, -0.15704345703125, -0.14249038696289062, -0.12793731689453125, -0.11338424682617188, -0.0988311767578125, -0.08427810668945312, -0.06972503662109375, -0.055171966552734375, -0.040618896484375, -0.026065826416015625, -0.01151275634765625, 0.003040313720703125, 0.0175933837890625, 0.032146453857421875, 0.04669952392578125, 0.061252593994140625, 0.0758056640625, 0.09035873413085938, 0.10491180419921875, 0.11946487426757812, 0.1340179443359375, 0.14857101440429688, 0.16312408447265625, 0.17767715454101562, 0.192230224609375, 0.20678329467773438, 0.22133636474609375, 0.23588943481445312, 0.2504425048828125, 0.2649955749511719, 0.27954864501953125, 0.2941017150878906, 0.30865478515625, 0.3232078552246094, 0.33776092529296875, 0.3523139953613281, 0.3668670654296875, 0.3814201354980469, 0.39597320556640625, 0.4105262756347656, 0.425079345703125, 0.4396324157714844, 0.45418548583984375, 0.4687385559082031, 0.4832916259765625, 0.4978446960449219, 0.5123977661132812, 0.5269508361816406, 0.54150390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 5.0, 9.0, 4.0, 12.0, 14.0, 27.0, 36.0, 49.0, 81.0, 101.0, 114.0, 117.0, 114.0, 87.0, 58.0, 40.0, 26.0, 22.0, 15.0, 16.0, 9.0, 12.0, 2.0, 6.0, 8.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.018182754516602e-05, -8.738785982131958e-05, -8.459389209747314e-05, -8.179992437362671e-05, -7.900595664978027e-05, -7.621198892593384e-05, -7.34180212020874e-05, -7.062405347824097e-05, -6.783008575439453e-05, -6.50361180305481e-05, -6.224215030670166e-05, -5.9448182582855225e-05, -5.665421485900879e-05, -5.3860247135162354e-05, -5.106627941131592e-05, -4.827231168746948e-05, -4.547834396362305e-05, -4.268437623977661e-05, -3.9890408515930176e-05, -3.709644079208374e-05, -3.4302473068237305e-05, -3.150850534439087e-05, -2.8714537620544434e-05, -2.5920569896697998e-05, -2.3126602172851562e-05, -2.0332634449005127e-05, -1.753866672515869e-05, -1.4744699001312256e-05, -1.195073127746582e-05, -9.156763553619385e-06, -6.362795829772949e-06, -3.5688281059265137e-06, -7.748603820800781e-07, 2.0191073417663574e-06, 4.813075065612793e-06, 7.6070427894592285e-06, 1.0401010513305664e-05, 1.31949782371521e-05, 1.5988945960998535e-05, 1.878291368484497e-05, 2.1576881408691406e-05, 2.4370849132537842e-05, 2.7164816856384277e-05, 2.9958784580230713e-05, 3.275275230407715e-05, 3.5546720027923584e-05, 3.834068775177002e-05, 4.1134655475616455e-05, 4.392862319946289e-05, 4.6722590923309326e-05, 4.951655864715576e-05, 5.23105263710022e-05, 5.510449409484863e-05, 5.789846181869507e-05, 6.0692429542541504e-05, 6.348639726638794e-05, 6.628036499023438e-05, 6.907433271408081e-05, 7.186830043792725e-05, 7.466226816177368e-05, 7.745623588562012e-05, 8.025020360946655e-05, 8.304417133331299e-05, 8.583813905715942e-05, 8.863210678100586e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 12.0, 8.0, 15.0, 22.0, 33.0, 48.0, 81.0, 112.0, 164.0, 264.0, 624.0, 1396.0, 4335.0, 15932.0, 78986.0, 533136.0, 348029.0, 49147.0, 10807.0, 3043.0, 1132.0, 518.0, 286.0, 147.0, 87.0, 51.0, 32.0, 30.0, 26.0, 13.0, 9.0, 7.0, 7.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.399169921875, -0.3853416442871094, -0.37151336669921875, -0.3576850891113281, -0.3438568115234375, -0.3300285339355469, -0.31620025634765625, -0.3023719787597656, -0.288543701171875, -0.2747154235839844, -0.26088714599609375, -0.24705886840820312, -0.2332305908203125, -0.21940231323242188, -0.20557403564453125, -0.19174575805664062, -0.17791748046875, -0.16408920288085938, -0.15026092529296875, -0.13643264770507812, -0.1226043701171875, -0.10877609252929688, -0.09494781494140625, -0.08111953735351562, -0.067291259765625, -0.053462982177734375, -0.03963470458984375, -0.025806427001953125, -0.0119781494140625, 0.001850128173828125, 0.01567840576171875, 0.029506683349609375, 0.0433349609375, 0.057163238525390625, 0.07099151611328125, 0.08481979370117188, 0.0986480712890625, 0.11247634887695312, 0.12630462646484375, 0.14013290405273438, 0.153961181640625, 0.16778945922851562, 0.18161773681640625, 0.19544601440429688, 0.2092742919921875, 0.22310256958007812, 0.23693084716796875, 0.2507591247558594, 0.26458740234375, 0.2784156799316406, 0.29224395751953125, 0.3060722351074219, 0.3199005126953125, 0.3337287902832031, 0.34755706787109375, 0.3613853454589844, 0.375213623046875, 0.3890419006347656, 0.40287017822265625, 0.4166984558105469, 0.4305267333984375, 0.4443550109863281, 0.45818328857421875, 0.4720115661621094, 0.48583984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 8.0, 11.0, 10.0, 10.0, 15.0, 22.0, 35.0, 45.0, 45.0, 71.0, 72.0, 51.0, 95.0, 85.0, 94.0, 71.0, 59.0, 49.0, 28.0, 21.0, 18.0, 23.0, 7.0, 15.0, 8.0, 2.0, 9.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.243896484375, -0.235107421875, -0.226318359375, -0.217529296875, -0.208740234375, -0.199951171875, -0.191162109375, -0.182373046875, -0.173583984375, -0.164794921875, -0.156005859375, -0.147216796875, -0.138427734375, -0.129638671875, -0.120849609375, -0.112060546875, -0.103271484375, -0.094482421875, -0.085693359375, -0.076904296875, -0.068115234375, -0.059326171875, -0.050537109375, -0.041748046875, -0.032958984375, -0.024169921875, -0.015380859375, -0.006591796875, 0.002197265625, 0.010986328125, 0.019775390625, 0.028564453125, 0.037353515625, 0.046142578125, 0.054931640625, 0.063720703125, 0.072509765625, 0.081298828125, 0.090087890625, 0.098876953125, 0.107666015625, 0.116455078125, 0.125244140625, 0.134033203125, 0.142822265625, 0.151611328125, 0.160400390625, 0.169189453125, 0.177978515625, 0.186767578125, 0.195556640625, 0.204345703125, 0.213134765625, 0.221923828125, 0.230712890625, 0.239501953125, 0.248291015625, 0.257080078125, 0.265869140625, 0.274658203125, 0.283447265625, 0.292236328125, 0.301025390625, 0.309814453125, 0.318603515625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 16.0, 60.0, 139.0, 251.0, 247.0, 177.0, 82.0, 20.0, 8.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.825963973999023, -16.469953536987305, -16.11394500732422, -15.7579345703125, -15.401925086975098, -15.045915603637695, -14.689906120300293, -14.33389663696289, -13.977886199951172, -13.62187671661377, -13.265867233276367, -12.909856796264648, -12.553847312927246, -12.197837829589844, -11.841828346252441, -11.485818862915039, -11.129809379577637, -10.773799896240234, -10.417790412902832, -10.06178092956543, -9.705770492553711, -9.349761009216309, -8.993751525878906, -8.637742042541504, -8.281732559204102, -7.925723075866699, -7.569713115692139, -7.213703632354736, -6.857693672180176, -6.501684188842773, -6.145674705505371, -5.789665222167969, -5.433655261993408, -5.077645778656006, -4.721635818481445, -4.365626335144043, -4.009616851806641, -3.65360689163208, -3.2975974082946777, -2.9415876865386963, -2.585577964782715, -2.2295682430267334, -1.8735586404800415, -1.5175490379333496, -1.1615393161773682, -0.8055295944213867, -0.4495201110839844, -0.09351038932800293, 0.2624993324279785, 0.6185089945793152, 0.9745186567306519, 1.3305282592773438, 1.6865379810333252, 2.0425477027893066, 2.398557186126709, 2.7545669078826904, 3.110576629638672, 3.4665863513946533, 3.8225960731506348, 4.178605556488037, 4.534615516662598, 4.890625, 5.246634483337402, 5.602643966674805, 5.958653926849365]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 8.0, 5.0, 9.0, 10.0, 7.0, 21.0, 19.0, 15.0, 29.0, 25.0, 21.0, 38.0, 30.0, 38.0, 43.0, 51.0, 47.0, 48.0, 42.0, 40.0, 52.0, 43.0, 34.0, 42.0, 35.0, 36.0, 27.0, 33.0, 23.0, 23.0, 19.0, 18.0, 15.0, 6.0, 3.0, 12.0, 9.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5132555961608887, -2.428422212600708, -2.3435890674591064, -2.258755683898926, -2.173922300338745, -2.0890889167785645, -2.004255771636963, -1.9194223880767822, -1.8345891237258911, -1.749755859375, -1.6649224758148193, -1.5800892114639282, -1.495255947113037, -1.4104225635528564, -1.3255892992019653, -1.2407560348510742, -1.1559226512908936, -1.0710893869400024, -0.9862560033798218, -0.9014227390289307, -0.8165894150733948, -0.7317560911178589, -0.6469228267669678, -0.5620895028114319, -0.477256178855896, -0.3924228549003601, -0.3075895607471466, -0.2227562665939331, -0.13792294263839722, -0.05308961868286133, 0.031743645668029785, 0.11657696962356567, 0.20141029357910156, 0.28624361753463745, 0.37107691168785095, 0.45591020584106445, 0.5407435297966003, 0.6255768537521362, 0.7104101181030273, 0.7952434420585632, 0.8800767660140991, 0.964910089969635, 1.049743413925171, 1.134576678276062, 1.2194099426269531, 1.3042433261871338, 1.389076590538025, 1.473909854888916, 1.5587432384490967, 1.6435765027999878, 1.7284098863601685, 1.8132431507110596, 1.8980765342712402, 1.9829097986221313, 2.0677430629730225, 2.152576446533203, 2.2374095916748047, 2.3222429752349854, 2.407076120376587, 2.4919095039367676, 2.5767428874969482, 2.661576271057129, 2.7464094161987305, 2.831242799758911, 2.916076183319092]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 9.0, 18.0, 28.0, 36.0, 33.0, 53.0, 96.0, 183.0, 351.0, 685.0, 1539.0, 3965.0, 13393.0, 94671.0, 3904053.0, 149659.0, 17776.0, 4545.0, 1660.0, 689.0, 327.0, 188.0, 109.0, 52.0, 42.0, 29.0, 19.0, 14.0, 15.0, 9.0, 8.0, 5.0, 2.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9111328125, -1.854217529296875, -1.79730224609375, -1.740386962890625, -1.6834716796875, -1.626556396484375, -1.56964111328125, -1.512725830078125, -1.455810546875, -1.398895263671875, -1.34197998046875, -1.285064697265625, -1.2281494140625, -1.171234130859375, -1.11431884765625, -1.057403564453125, -1.00048828125, -0.943572998046875, -0.88665771484375, -0.829742431640625, -0.7728271484375, -0.715911865234375, -0.65899658203125, -0.602081298828125, -0.545166015625, -0.488250732421875, -0.43133544921875, -0.374420166015625, -0.3175048828125, -0.260589599609375, -0.20367431640625, -0.146759033203125, -0.08984375, -0.032928466796875, 0.02398681640625, 0.080902099609375, 0.1378173828125, 0.194732666015625, 0.25164794921875, 0.308563232421875, 0.365478515625, 0.422393798828125, 0.47930908203125, 0.536224365234375, 0.5931396484375, 0.650054931640625, 0.70697021484375, 0.763885498046875, 0.82080078125, 0.877716064453125, 0.93463134765625, 0.991546630859375, 1.0484619140625, 1.105377197265625, 1.16229248046875, 1.219207763671875, 1.276123046875, 1.333038330078125, 1.38995361328125, 1.446868896484375, 1.5037841796875, 1.560699462890625, 1.61761474609375, 1.674530029296875, 1.7314453125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 8.0, 12.0, 12.0, 9.0, 29.0, 26.0, 34.0, 33.0, 35.0, 46.0, 40.0, 41.0, 56.0, 61.0, 53.0, 57.0, 59.0, 55.0, 51.0, 46.0, 38.0, 32.0, 26.0, 28.0, 29.0, 26.0, 11.0, 8.0, 6.0, 9.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1812744140625, -0.1757221221923828, -0.17016983032226562, -0.16461753845214844, -0.15906524658203125, -0.15351295471191406, -0.14796066284179688, -0.1424083709716797, -0.1368560791015625, -0.1313037872314453, -0.12575149536132812, -0.12019920349121094, -0.11464691162109375, -0.10909461975097656, -0.10354232788085938, -0.09799003601074219, -0.092437744140625, -0.08688545227050781, -0.08133316040039062, -0.07578086853027344, -0.07022857666015625, -0.06467628479003906, -0.059123992919921875, -0.05357170104980469, -0.0480194091796875, -0.04246711730957031, -0.036914825439453125, -0.03136253356933594, -0.02581024169921875, -0.020257949829101562, -0.014705657958984375, -0.009153366088867188, -0.00360107421875, 0.0019512176513671875, 0.007503509521484375, 0.013055801391601562, 0.01860809326171875, 0.024160385131835938, 0.029712677001953125, 0.03526496887207031, 0.0408172607421875, 0.04636955261230469, 0.051921844482421875, 0.05747413635253906, 0.06302642822265625, 0.06857872009277344, 0.07413101196289062, 0.07968330383300781, 0.085235595703125, 0.09078788757324219, 0.09634017944335938, 0.10189247131347656, 0.10744476318359375, 0.11299705505371094, 0.11854934692382812, 0.12410163879394531, 0.1296539306640625, 0.1352062225341797, 0.14075851440429688, 0.14631080627441406, 0.15186309814453125, 0.15741539001464844, 0.16296768188476562, 0.1685199737548828, 0.174072265625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 14.0, 21.0, 43.0, 61.0, 55.0, 106.0, 226.0, 351.0, 681.0, 1580.0, 5380.0, 25150.0, 373403.0, 3707523.0, 65019.0, 9861.0, 2641.0, 980.0, 487.0, 265.0, 159.0, 91.0, 56.0, 41.0, 30.0, 21.0, 10.0, 10.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.333984375, -2.27447509765625, -2.2149658203125, -2.15545654296875, -2.095947265625, -2.03643798828125, -1.9769287109375, -1.91741943359375, -1.85791015625, -1.79840087890625, -1.7388916015625, -1.67938232421875, -1.619873046875, -1.56036376953125, -1.5008544921875, -1.44134521484375, -1.3818359375, -1.32232666015625, -1.2628173828125, -1.20330810546875, -1.143798828125, -1.08428955078125, -1.0247802734375, -0.96527099609375, -0.90576171875, -0.84625244140625, -0.7867431640625, -0.72723388671875, -0.667724609375, -0.60821533203125, -0.5487060546875, -0.48919677734375, -0.4296875, -0.37017822265625, -0.3106689453125, -0.25115966796875, -0.191650390625, -0.13214111328125, -0.0726318359375, -0.01312255859375, 0.04638671875, 0.10589599609375, 0.1654052734375, 0.22491455078125, 0.284423828125, 0.34393310546875, 0.4034423828125, 0.46295166015625, 0.5224609375, 0.58197021484375, 0.6414794921875, 0.70098876953125, 0.760498046875, 0.82000732421875, 0.8795166015625, 0.93902587890625, 0.99853515625, 1.05804443359375, 1.1175537109375, 1.17706298828125, 1.236572265625, 1.29608154296875, 1.3555908203125, 1.41510009765625, 1.474609375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 5.0, 13.0, 14.0, 23.0, 35.0, 74.0, 106.0, 227.0, 781.0, 2061.0, 356.0, 146.0, 73.0, 58.0, 34.0, 14.0, 12.0, 11.0, 4.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39697265625, -0.3812408447265625, -0.365509033203125, -0.3497772216796875, -0.33404541015625, -0.3183135986328125, -0.302581787109375, -0.2868499755859375, -0.2711181640625, -0.2553863525390625, -0.239654541015625, -0.2239227294921875, -0.20819091796875, -0.1924591064453125, -0.176727294921875, -0.1609954833984375, -0.145263671875, -0.1295318603515625, -0.113800048828125, -0.0980682373046875, -0.08233642578125, -0.0666046142578125, -0.050872802734375, -0.0351409912109375, -0.0194091796875, -0.0036773681640625, 0.012054443359375, 0.0277862548828125, 0.04351806640625, 0.0592498779296875, 0.074981689453125, 0.0907135009765625, 0.1064453125, 0.1221771240234375, 0.137908935546875, 0.1536407470703125, 0.16937255859375, 0.1851043701171875, 0.200836181640625, 0.2165679931640625, 0.2322998046875, 0.2480316162109375, 0.263763427734375, 0.2794952392578125, 0.29522705078125, 0.3109588623046875, 0.326690673828125, 0.3424224853515625, 0.358154296875, 0.3738861083984375, 0.389617919921875, 0.4053497314453125, 0.42108154296875, 0.4368133544921875, 0.452545166015625, 0.4682769775390625, 0.4840087890625, 0.4997406005859375, 0.515472412109375, 0.5312042236328125, 0.54693603515625, 0.5626678466796875, 0.578399658203125, 0.5941314697265625, 0.60986328125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 34.0, 103.0, 261.0, 330.0, 181.0, 46.0, 18.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.936696529388428, -5.757986068725586, -5.579276084899902, -5.4005656242370605, -5.221855163574219, -5.043145179748535, -4.864434719085693, -4.685724258422852, -4.507014274597168, -4.328303813934326, -4.149593830108643, -3.970883369445801, -3.792172908782959, -3.6134626865386963, -3.4347524642944336, -3.256042003631592, -3.07733154296875, -2.8986213207244873, -2.7199108600616455, -2.541200637817383, -2.362490177154541, -2.1837799549102783, -2.0050697326660156, -1.8263593912124634, -1.6476490497589111, -1.4689387083053589, -1.2902283668518066, -1.111518144607544, -0.9328078031539917, -0.7540974617004395, -0.5753872394561768, -0.3966768980026245, -0.21796703338623047, -0.03925672173500061, 0.13945358991622925, 0.3181638717651367, 0.49687421321868896, 0.6755845546722412, 0.8542947769165039, 1.0330051183700562, 1.2117154598236084, 1.3904258012771606, 1.569136142730713, 1.7478463649749756, 1.9265567064285278, 2.10526704788208, 2.2839772701263428, 2.4626874923706055, 2.6413979530334473, 2.82010817527771, 2.9988186359405518, 3.1775288581848145, 3.3562393188476562, 3.534949541091919, 3.7136597633361816, 3.8923702239990234, 4.071080207824707, 4.249790668487549, 4.428500652313232, 4.607211112976074, 4.785921573638916, 4.964632034301758, 5.143342018127441, 5.322052478790283, 5.500762939453125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 8.0, 14.0, 12.0, 10.0, 19.0, 14.0, 31.0, 32.0, 41.0, 35.0, 53.0, 54.0, 48.0, 66.0, 70.0, 55.0, 50.0, 61.0, 62.0, 44.0, 37.0, 35.0, 25.0, 32.0, 26.0, 22.0, 9.0, 4.0, 6.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4183084964752197, -1.3751988410949707, -1.3320890665054321, -1.288979411125183, -1.245869755744934, -1.2027599811553955, -1.1596503257751465, -1.1165406703948975, -1.0734310150146484, -1.0303213596343994, -0.9872116446495056, -0.9441019296646118, -0.9009922742843628, -0.857882559299469, -0.8147728443145752, -0.7716631889343262, -0.7285534143447876, -0.6854436993598938, -0.6423340439796448, -0.599224328994751, -0.556114673614502, -0.5130049586296082, -0.46989524364471436, -0.42678555846214294, -0.38367587327957153, -0.3405661880970001, -0.2974565029144287, -0.2543467879295349, -0.2112371027469635, -0.1681274175643921, -0.1250177025794983, -0.08190801739692688, -0.03879821300506592, 0.00431147962808609, 0.0474211722612381, 0.0905308723449707, 0.13364055752754211, 0.17675024271011353, 0.21985995769500732, 0.26296964287757874, 0.30607932806015015, 0.34918901324272156, 0.39229869842529297, 0.43540841341018677, 0.4785180985927582, 0.5216277837753296, 0.5647374987602234, 0.6078472137451172, 0.6509568691253662, 0.69406658411026, 0.737176239490509, 0.7802859544754028, 0.8233956098556519, 0.8665053248405457, 0.9096150398254395, 0.9527246952056885, 0.9958344101905823, 1.038944125175476, 1.082053780555725, 1.1251635551452637, 1.1682732105255127, 1.2113828659057617, 1.2544925212860107, 1.2976022958755493, 1.3407119512557983]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 8.0, 16.0, 16.0, 18.0, 28.0, 33.0, 41.0, 73.0, 137.0, 209.0, 326.0, 653.0, 1289.0, 2954.0, 8017.0, 25662.0, 93509.0, 315171.0, 402326.0, 141033.0, 38171.0, 11266.0, 4024.0, 1659.0, 820.0, 437.0, 236.0, 148.0, 76.0, 65.0, 31.0, 35.0, 19.0, 11.0, 11.0, 5.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.97509765625, -0.9404678344726562, -0.9058380126953125, -0.8712081909179688, -0.836578369140625, -0.8019485473632812, -0.7673187255859375, -0.7326889038085938, -0.69805908203125, -0.6634292602539062, -0.6287994384765625, -0.5941696166992188, -0.559539794921875, -0.5249099731445312, -0.4902801513671875, -0.45565032958984375, -0.4210205078125, -0.38639068603515625, -0.3517608642578125, -0.31713104248046875, -0.282501220703125, -0.24787139892578125, -0.2132415771484375, -0.17861175537109375, -0.14398193359375, -0.10935211181640625, -0.0747222900390625, -0.04009246826171875, -0.005462646484375, 0.02916717529296875, 0.0637969970703125, 0.09842681884765625, 0.133056640625, 0.16768646240234375, 0.2023162841796875, 0.23694610595703125, 0.271575927734375, 0.30620574951171875, 0.3408355712890625, 0.37546539306640625, 0.41009521484375, 0.44472503662109375, 0.4793548583984375, 0.5139846801757812, 0.548614501953125, 0.5832443237304688, 0.6178741455078125, 0.6525039672851562, 0.6871337890625, 0.7217636108398438, 0.7563934326171875, 0.7910232543945312, 0.825653076171875, 0.8602828979492188, 0.8949127197265625, 0.9295425415039062, 0.96417236328125, 0.9988021850585938, 1.0334320068359375, 1.0680618286132812, 1.102691650390625, 1.1373214721679688, 1.1719512939453125, 1.2065811157226562, 1.2412109375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 8.0, 9.0, 5.0, 11.0, 12.0, 14.0, 17.0, 29.0, 20.0, 38.0, 44.0, 50.0, 48.0, 55.0, 59.0, 60.0, 59.0, 47.0, 58.0, 48.0, 46.0, 43.0, 47.0, 32.0, 30.0, 33.0, 16.0, 9.0, 20.0, 11.0, 3.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.20703125, -0.20101547241210938, -0.19499969482421875, -0.18898391723632812, -0.1829681396484375, -0.17695236206054688, -0.17093658447265625, -0.16492080688476562, -0.158905029296875, -0.15288925170898438, -0.14687347412109375, -0.14085769653320312, -0.1348419189453125, -0.12882614135742188, -0.12281036376953125, -0.11679458618164062, -0.11077880859375, -0.10476303100585938, -0.09874725341796875, -0.09273147583007812, -0.0867156982421875, -0.08069992065429688, -0.07468414306640625, -0.06866836547851562, -0.062652587890625, -0.056636810302734375, -0.05062103271484375, -0.044605255126953125, -0.0385894775390625, -0.032573699951171875, -0.02655792236328125, -0.020542144775390625, -0.0145263671875, -0.008510589599609375, -0.00249481201171875, 0.003520965576171875, 0.0095367431640625, 0.015552520751953125, 0.02156829833984375, 0.027584075927734375, 0.033599853515625, 0.039615631103515625, 0.04563140869140625, 0.051647186279296875, 0.0576629638671875, 0.06367874145507812, 0.06969451904296875, 0.07571029663085938, 0.08172607421875, 0.08774185180664062, 0.09375762939453125, 0.09977340698242188, 0.1057891845703125, 0.11180496215820312, 0.11782073974609375, 0.12383651733398438, 0.129852294921875, 0.13586807250976562, 0.14188385009765625, 0.14789962768554688, 0.1539154052734375, 0.15993118286132812, 0.16594696044921875, 0.17196273803710938, 0.177978515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 3.0, 10.0, 15.0, 27.0, 28.0, 50.0, 73.0, 102.0, 178.0, 263.0, 406.0, 635.0, 1149.0, 2147.0, 4057.0, 8680.0, 19941.0, 48090.0, 114375.0, 242763.0, 298564.0, 174802.0, 75024.0, 31041.0, 13370.0, 6021.0, 2863.0, 1540.0, 871.0, 501.0, 342.0, 202.0, 115.0, 87.0, 62.0, 57.0, 36.0, 23.0, 11.0, 13.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.64501953125, -0.6267242431640625, -0.608428955078125, -0.5901336669921875, -0.57183837890625, -0.5535430908203125, -0.535247802734375, -0.5169525146484375, -0.4986572265625, -0.4803619384765625, -0.462066650390625, -0.4437713623046875, -0.42547607421875, -0.4071807861328125, -0.388885498046875, -0.3705902099609375, -0.352294921875, -0.3339996337890625, -0.315704345703125, -0.2974090576171875, -0.27911376953125, -0.2608184814453125, -0.242523193359375, -0.2242279052734375, -0.2059326171875, -0.1876373291015625, -0.169342041015625, -0.1510467529296875, -0.13275146484375, -0.1144561767578125, -0.096160888671875, -0.0778656005859375, -0.0595703125, -0.0412750244140625, -0.022979736328125, -0.0046844482421875, 0.01361083984375, 0.0319061279296875, 0.050201416015625, 0.0684967041015625, 0.0867919921875, 0.1050872802734375, 0.123382568359375, 0.1416778564453125, 0.15997314453125, 0.1782684326171875, 0.196563720703125, 0.2148590087890625, 0.233154296875, 0.2514495849609375, 0.269744873046875, 0.2880401611328125, 0.30633544921875, 0.3246307373046875, 0.342926025390625, 0.3612213134765625, 0.3795166015625, 0.3978118896484375, 0.416107177734375, 0.4344024658203125, 0.45269775390625, 0.4709930419921875, 0.489288330078125, 0.5075836181640625, 0.52587890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 9.0, 7.0, 6.0, 6.0, 10.0, 18.0, 22.0, 17.0, 21.0, 28.0, 26.0, 37.0, 45.0, 42.0, 48.0, 36.0, 55.0, 30.0, 36.0, 48.0, 50.0, 43.0, 46.0, 57.0, 29.0, 37.0, 34.0, 24.0, 22.0, 18.0, 18.0, 10.0, 10.0, 14.0, 7.0, 8.0, 7.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.74267578125, -0.7205734252929688, -0.6984710693359375, -0.6763687133789062, -0.654266357421875, -0.6321640014648438, -0.6100616455078125, -0.5879592895507812, -0.56585693359375, -0.5437545776367188, -0.5216522216796875, -0.49954986572265625, -0.477447509765625, -0.45534515380859375, -0.4332427978515625, -0.41114044189453125, -0.3890380859375, -0.36693572998046875, -0.3448333740234375, -0.32273101806640625, -0.300628662109375, -0.27852630615234375, -0.2564239501953125, -0.23432159423828125, -0.21221923828125, -0.19011688232421875, -0.1680145263671875, -0.14591217041015625, -0.123809814453125, -0.10170745849609375, -0.0796051025390625, -0.05750274658203125, -0.035400390625, -0.01329803466796875, 0.0088043212890625, 0.03090667724609375, 0.053009033203125, 0.07511138916015625, 0.0972137451171875, 0.11931610107421875, 0.14141845703125, 0.16352081298828125, 0.1856231689453125, 0.20772552490234375, 0.229827880859375, 0.25193023681640625, 0.2740325927734375, 0.29613494873046875, 0.3182373046875, 0.34033966064453125, 0.3624420166015625, 0.38454437255859375, 0.406646728515625, 0.42874908447265625, 0.4508514404296875, 0.47295379638671875, 0.49505615234375, 0.5171585083007812, 0.5392608642578125, 0.5613632202148438, 0.583465576171875, 0.6055679321289062, 0.6276702880859375, 0.6497726440429688, 0.671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 14.0, 10.0, 14.0, 33.0, 78.0, 126.0, 237.0, 518.0, 1349.0, 5303.0, 30098.0, 255831.0, 635507.0, 101238.0, 13732.0, 2859.0, 882.0, 340.0, 176.0, 109.0, 44.0, 23.0, 14.0, 9.0, 5.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.64501953125, -0.6244049072265625, -0.603790283203125, -0.5831756591796875, -0.56256103515625, -0.5419464111328125, -0.521331787109375, -0.5007171630859375, -0.4801025390625, -0.4594879150390625, -0.438873291015625, -0.4182586669921875, -0.39764404296875, -0.3770294189453125, -0.356414794921875, -0.3358001708984375, -0.315185546875, -0.2945709228515625, -0.273956298828125, -0.2533416748046875, -0.23272705078125, -0.2121124267578125, -0.191497802734375, -0.1708831787109375, -0.1502685546875, -0.1296539306640625, -0.109039306640625, -0.0884246826171875, -0.06781005859375, -0.0471954345703125, -0.026580810546875, -0.0059661865234375, 0.0146484375, 0.0352630615234375, 0.055877685546875, 0.0764923095703125, 0.09710693359375, 0.1177215576171875, 0.138336181640625, 0.1589508056640625, 0.1795654296875, 0.2001800537109375, 0.220794677734375, 0.2414093017578125, 0.26202392578125, 0.2826385498046875, 0.303253173828125, 0.3238677978515625, 0.344482421875, 0.3650970458984375, 0.385711669921875, 0.4063262939453125, 0.42694091796875, 0.4475555419921875, 0.468170166015625, 0.4887847900390625, 0.5093994140625, 0.5300140380859375, 0.550628662109375, 0.5712432861328125, 0.59185791015625, 0.6124725341796875, 0.633087158203125, 0.6537017822265625, 0.67431640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 8.0, 5.0, 5.0, 6.0, 6.0, 12.0, 20.0, 23.0, 23.0, 29.0, 41.0, 53.0, 50.0, 77.0, 57.0, 74.0, 81.0, 86.0, 73.0, 64.0, 42.0, 37.0, 26.0, 24.0, 15.0, 10.0, 13.0, 7.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.790327072143555e-05, -7.561780512332916e-05, -7.333233952522278e-05, -7.10468739271164e-05, -6.876140832901001e-05, -6.647594273090363e-05, -6.419047713279724e-05, -6.190501153469086e-05, -5.961954593658447e-05, -5.733408033847809e-05, -5.5048614740371704e-05, -5.276314914226532e-05, -5.0477683544158936e-05, -4.819221794605255e-05, -4.590675234794617e-05, -4.362128674983978e-05, -4.13358211517334e-05, -3.9050355553627014e-05, -3.676488995552063e-05, -3.4479424357414246e-05, -3.219395875930786e-05, -2.9908493161201477e-05, -2.7623027563095093e-05, -2.533756196498871e-05, -2.3052096366882324e-05, -2.076663076877594e-05, -1.8481165170669556e-05, -1.619569957256317e-05, -1.3910233974456787e-05, -1.1624768376350403e-05, -9.339302778244019e-06, -7.053837180137634e-06, -4.76837158203125e-06, -2.4829059839248657e-06, -1.9744038581848145e-07, 2.088025212287903e-06, 4.373490810394287e-06, 6.658956408500671e-06, 8.944422006607056e-06, 1.122988760471344e-05, 1.3515353202819824e-05, 1.580081880092621e-05, 1.8086284399032593e-05, 2.0371749997138977e-05, 2.265721559524536e-05, 2.4942681193351746e-05, 2.722814679145813e-05, 2.9513612389564514e-05, 3.17990779876709e-05, 3.408454358577728e-05, 3.637000918388367e-05, 3.865547478199005e-05, 4.0940940380096436e-05, 4.322640597820282e-05, 4.5511871576309204e-05, 4.779733717441559e-05, 5.008280277252197e-05, 5.236826837062836e-05, 5.465373396873474e-05, 5.6939199566841125e-05, 5.922466516494751e-05, 6.15101307630539e-05, 6.379559636116028e-05, 6.608106195926666e-05, 6.836652755737305e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 6.0, 13.0, 14.0, 27.0, 33.0, 67.0, 84.0, 135.0, 238.0, 448.0, 762.0, 1680.0, 3832.0, 9817.0, 27181.0, 80346.0, 246079.0, 402461.0, 182511.0, 59199.0, 20181.0, 7518.0, 2953.0, 1407.0, 695.0, 353.0, 205.0, 113.0, 69.0, 32.0, 39.0, 16.0, 9.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.338134765625, -0.3266181945800781, -0.31510162353515625, -0.3035850524902344, -0.2920684814453125, -0.2805519104003906, -0.26903533935546875, -0.2575187683105469, -0.246002197265625, -0.23448562622070312, -0.22296905517578125, -0.21145248413085938, -0.1999359130859375, -0.18841934204101562, -0.17690277099609375, -0.16538619995117188, -0.15386962890625, -0.14235305786132812, -0.13083648681640625, -0.11931991577148438, -0.1078033447265625, -0.09628677368164062, -0.08477020263671875, -0.07325363159179688, -0.061737060546875, -0.050220489501953125, -0.03870391845703125, -0.027187347412109375, -0.0156707763671875, -0.004154205322265625, 0.00736236572265625, 0.018878936767578125, 0.0303955078125, 0.041912078857421875, 0.05342864990234375, 0.06494522094726562, 0.0764617919921875, 0.08797836303710938, 0.09949493408203125, 0.11101150512695312, 0.122528076171875, 0.13404464721679688, 0.14556121826171875, 0.15707778930664062, 0.1685943603515625, 0.18011093139648438, 0.19162750244140625, 0.20314407348632812, 0.21466064453125, 0.22617721557617188, 0.23769378662109375, 0.24921035766601562, 0.2607269287109375, 0.2722434997558594, 0.28376007080078125, 0.2952766418457031, 0.306793212890625, 0.3183097839355469, 0.32982635498046875, 0.3413429260253906, 0.3528594970703125, 0.3643760681152344, 0.37589263916015625, 0.3874092102050781, 0.39892578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 4.0, 4.0, 6.0, 6.0, 12.0, 10.0, 21.0, 24.0, 18.0, 19.0, 27.0, 41.0, 41.0, 52.0, 61.0, 68.0, 71.0, 83.0, 74.0, 54.0, 49.0, 42.0, 37.0, 34.0, 25.0, 25.0, 11.0, 21.0, 9.0, 11.0, 6.0, 8.0, 6.0, 2.0, 2.0, 5.0, 10.0, 0.0, 1.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.420654296875, -0.4083213806152344, -0.39598846435546875, -0.3836555480957031, -0.3713226318359375, -0.3589897155761719, -0.34665679931640625, -0.3343238830566406, -0.321990966796875, -0.3096580505371094, -0.29732513427734375, -0.2849922180175781, -0.2726593017578125, -0.2603263854980469, -0.24799346923828125, -0.23566055297851562, -0.22332763671875, -0.21099472045898438, -0.19866180419921875, -0.18632888793945312, -0.1739959716796875, -0.16166305541992188, -0.14933013916015625, -0.13699722290039062, -0.124664306640625, -0.11233139038085938, -0.09999847412109375, -0.08766555786132812, -0.0753326416015625, -0.06299972534179688, -0.05066680908203125, -0.038333892822265625, -0.0260009765625, -0.013668060302734375, -0.00133514404296875, 0.010997772216796875, 0.0233306884765625, 0.035663604736328125, 0.04799652099609375, 0.060329437255859375, 0.072662353515625, 0.08499526977539062, 0.09732818603515625, 0.10966110229492188, 0.1219940185546875, 0.13432693481445312, 0.14665985107421875, 0.15899276733398438, 0.17132568359375, 0.18365859985351562, 0.19599151611328125, 0.20832443237304688, 0.2206573486328125, 0.23299026489257812, 0.24532318115234375, 0.2576560974121094, 0.269989013671875, 0.2823219299316406, 0.29465484619140625, 0.3069877624511719, 0.3193206787109375, 0.3316535949707031, 0.34398651123046875, 0.3563194274902344, 0.36865234375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 9.0, 15.0, 18.0, 40.0, 72.0, 130.0, 177.0, 170.0, 152.0, 121.0, 50.0, 20.0, 19.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.444522857666016, -16.117935180664062, -15.79134750366211, -15.464759826660156, -15.138172149658203, -14.81158447265625, -14.484996795654297, -14.158409118652344, -13.83182144165039, -13.505233764648438, -13.178646087646484, -12.852058410644531, -12.525470733642578, -12.198883056640625, -11.872295379638672, -11.545707702636719, -11.219120979309082, -10.892533302307129, -10.565945625305176, -10.239357948303223, -9.91277027130127, -9.586182594299316, -9.259594917297363, -8.933008193969727, -8.606420516967773, -8.27983283996582, -7.953245162963867, -7.626657485961914, -7.300069808959961, -6.973482131958008, -6.646894931793213, -6.32030725479126, -5.993719100952148, -5.667131423950195, -5.340543746948242, -5.013956069946289, -4.687368392944336, -4.360780715942383, -4.034193515777588, -3.7076058387756348, -3.3810181617736816, -3.0544304847717285, -2.7278428077697754, -2.4012553691864014, -2.0746676921844482, -1.7480800151824951, -1.4214924573898315, -1.094904899597168, -0.7683172225952148, -0.4417296051979065, -0.11514198780059814, 0.2114456295967102, 0.5380332469940186, 0.8646209239959717, 1.1912084817886353, 1.5177960395812988, 1.844383716583252, 2.170971393585205, 2.497559070587158, 2.8241465091705322, 3.1507341861724854, 3.4773218631744385, 3.8039093017578125, 4.130496978759766, 4.457084655761719]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 6.0, 5.0, 12.0, 9.0, 9.0, 15.0, 17.0, 18.0, 20.0, 23.0, 25.0, 38.0, 25.0, 36.0, 42.0, 48.0, 38.0, 55.0, 45.0, 55.0, 54.0, 37.0, 55.0, 38.0, 46.0, 36.0, 35.0, 25.0, 17.0, 33.0, 18.0, 11.0, 15.0, 10.0, 7.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.402034759521484, -4.275336265563965, -4.148637294769287, -4.021938800811768, -3.895240068435669, -3.7685413360595703, -3.641842842102051, -3.515144109725952, -3.3884453773498535, -3.261746644973755, -3.1350479125976562, -3.0083494186401367, -2.881650686264038, -2.7549519538879395, -2.62825345993042, -2.5015547275543213, -2.3748559951782227, -2.248157262802124, -2.1214585304260254, -1.9947600364685059, -1.8680613040924072, -1.7413625717163086, -1.6146639585494995, -1.4879653453826904, -1.3612666130065918, -1.2345678806304932, -1.107869267463684, -0.9811705946922302, -0.8544719219207764, -0.7277732491493225, -0.6010745763778687, -0.4743759036064148, -0.34767723083496094, -0.22097855806350708, -0.09427988529205322, 0.032418787479400635, 0.1591174602508545, 0.28581613302230835, 0.4125148057937622, 0.5392134785652161, 0.6659121513366699, 0.7926108241081238, 0.9193094968795776, 1.0460081100463867, 1.1727068424224854, 1.299405574798584, 1.426104187965393, 1.5528028011322021, 1.6795015335083008, 1.8062002658843994, 1.9328988790512085, 2.0595974922180176, 2.186296224594116, 2.312994956970215, 2.4396934509277344, 2.566392183303833, 2.6930909156799316, 2.8197896480560303, 2.946488380432129, 3.0731868743896484, 3.199885606765747, 3.3265843391418457, 3.4532828330993652, 3.579981565475464, 3.7066802978515625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 11.0, 14.0, 22.0, 25.0, 46.0, 80.0, 134.0, 245.0, 534.0, 1488.0, 4394.0, 18324.0, 139865.0, 3822677.0, 177738.0, 21159.0, 4921.0, 1547.0, 538.0, 225.0, 106.0, 63.0, 41.0, 18.0, 14.0, 9.0, 10.0, 4.0, 5.0, 4.0, 4.0, 3.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.41015625, -1.34759521484375, -1.2850341796875, -1.22247314453125, -1.159912109375, -1.09735107421875, -1.0347900390625, -0.97222900390625, -0.90966796875, -0.84710693359375, -0.7845458984375, -0.72198486328125, -0.659423828125, -0.59686279296875, -0.5343017578125, -0.47174072265625, -0.4091796875, -0.34661865234375, -0.2840576171875, -0.22149658203125, -0.158935546875, -0.09637451171875, -0.0338134765625, 0.02874755859375, 0.09130859375, 0.15386962890625, 0.2164306640625, 0.27899169921875, 0.341552734375, 0.40411376953125, 0.4666748046875, 0.52923583984375, 0.591796875, 0.65435791015625, 0.7169189453125, 0.77947998046875, 0.842041015625, 0.90460205078125, 0.9671630859375, 1.02972412109375, 1.09228515625, 1.15484619140625, 1.2174072265625, 1.27996826171875, 1.342529296875, 1.40509033203125, 1.4676513671875, 1.53021240234375, 1.5927734375, 1.65533447265625, 1.7178955078125, 1.78045654296875, 1.843017578125, 1.90557861328125, 1.9681396484375, 2.03070068359375, 2.09326171875, 2.15582275390625, 2.2183837890625, 2.28094482421875, 2.343505859375, 2.40606689453125, 2.4686279296875, 2.53118896484375, 2.59375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 9.0, 9.0, 12.0, 10.0, 16.0, 16.0, 19.0, 21.0, 27.0, 23.0, 36.0, 47.0, 51.0, 48.0, 47.0, 63.0, 42.0, 53.0, 61.0, 47.0, 65.0, 40.0, 36.0, 33.0, 27.0, 30.0, 22.0, 22.0, 11.0, 17.0, 12.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2069091796875, -0.20078468322753906, -0.19466018676757812, -0.1885356903076172, -0.18241119384765625, -0.1762866973876953, -0.17016220092773438, -0.16403770446777344, -0.1579132080078125, -0.15178871154785156, -0.14566421508789062, -0.1395397186279297, -0.13341522216796875, -0.1272907257080078, -0.12116622924804688, -0.11504173278808594, -0.108917236328125, -0.10279273986816406, -0.09666824340820312, -0.09054374694824219, -0.08441925048828125, -0.07829475402832031, -0.07217025756835938, -0.06604576110839844, -0.0599212646484375, -0.05379676818847656, -0.047672271728515625, -0.04154777526855469, -0.03542327880859375, -0.029298782348632812, -0.023174285888671875, -0.017049789428710938, -0.01092529296875, -0.0048007965087890625, 0.001323699951171875, 0.0074481964111328125, 0.01357269287109375, 0.019697189331054688, 0.025821685791015625, 0.03194618225097656, 0.0380706787109375, 0.04419517517089844, 0.050319671630859375, 0.05644416809082031, 0.06256866455078125, 0.06869316101074219, 0.07481765747070312, 0.08094215393066406, 0.087066650390625, 0.09319114685058594, 0.09931564331054688, 0.10544013977050781, 0.11156463623046875, 0.11768913269042969, 0.12381362915039062, 0.12993812561035156, 0.1360626220703125, 0.14218711853027344, 0.14831161499023438, 0.1544361114501953, 0.16056060791015625, 0.1666851043701172, 0.17280960083007812, 0.17893409729003906, 0.18505859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 7.0, 7.0, 6.0, 13.0, 20.0, 20.0, 42.0, 46.0, 73.0, 109.0, 156.0, 251.0, 397.0, 571.0, 975.0, 1679.0, 3200.0, 6563.0, 16481.0, 53374.0, 298933.0, 3394356.0, 328770.0, 56471.0, 17268.0, 6765.0, 3281.0, 1654.0, 1040.0, 587.0, 410.0, 235.0, 168.0, 101.0, 74.0, 52.0, 38.0, 24.0, 19.0, 21.0, 7.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.3203125, -1.28314208984375, -1.2459716796875, -1.20880126953125, -1.171630859375, -1.13446044921875, -1.0972900390625, -1.06011962890625, -1.02294921875, -0.98577880859375, -0.9486083984375, -0.91143798828125, -0.874267578125, -0.83709716796875, -0.7999267578125, -0.76275634765625, -0.7255859375, -0.68841552734375, -0.6512451171875, -0.61407470703125, -0.576904296875, -0.53973388671875, -0.5025634765625, -0.46539306640625, -0.42822265625, -0.39105224609375, -0.3538818359375, -0.31671142578125, -0.279541015625, -0.24237060546875, -0.2052001953125, -0.16802978515625, -0.130859375, -0.09368896484375, -0.0565185546875, -0.01934814453125, 0.017822265625, 0.05499267578125, 0.0921630859375, 0.12933349609375, 0.16650390625, 0.20367431640625, 0.2408447265625, 0.27801513671875, 0.315185546875, 0.35235595703125, 0.3895263671875, 0.42669677734375, 0.4638671875, 0.50103759765625, 0.5382080078125, 0.57537841796875, 0.612548828125, 0.64971923828125, 0.6868896484375, 0.72406005859375, 0.76123046875, 0.79840087890625, 0.8355712890625, 0.87274169921875, 0.909912109375, 0.94708251953125, 0.9842529296875, 1.02142333984375, 1.05859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 4.0, 6.0, 9.0, 15.0, 22.0, 35.0, 58.0, 98.0, 202.0, 507.0, 1960.0, 610.0, 232.0, 107.0, 70.0, 34.0, 27.0, 17.0, 15.0, 7.0, 4.0, 8.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64599609375, -0.6225814819335938, -0.5991668701171875, -0.5757522583007812, -0.552337646484375, -0.5289230346679688, -0.5055084228515625, -0.48209381103515625, -0.45867919921875, -0.43526458740234375, -0.4118499755859375, -0.38843536376953125, -0.365020751953125, -0.34160614013671875, -0.3181915283203125, -0.29477691650390625, -0.2713623046875, -0.24794769287109375, -0.2245330810546875, -0.20111846923828125, -0.177703857421875, -0.15428924560546875, -0.1308746337890625, -0.10746002197265625, -0.08404541015625, -0.06063079833984375, -0.0372161865234375, -0.01380157470703125, 0.009613037109375, 0.03302764892578125, 0.0564422607421875, 0.07985687255859375, 0.103271484375, 0.12668609619140625, 0.1501007080078125, 0.17351531982421875, 0.196929931640625, 0.22034454345703125, 0.2437591552734375, 0.26717376708984375, 0.29058837890625, 0.31400299072265625, 0.3374176025390625, 0.36083221435546875, 0.384246826171875, 0.40766143798828125, 0.4310760498046875, 0.45449066162109375, 0.4779052734375, 0.5013198852539062, 0.5247344970703125, 0.5481491088867188, 0.571563720703125, 0.5949783325195312, 0.6183929443359375, 0.6418075561523438, 0.66522216796875, 0.6886367797851562, 0.7120513916015625, 0.7354660034179688, 0.758880615234375, 0.7822952270507812, 0.8057098388671875, 0.8291244506835938, 0.8525390625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 8.0, 25.0, 45.0, 104.0, 173.0, 210.0, 186.0, 133.0, 56.0, 35.0, 13.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.316376686096191, -9.11625862121582, -8.91614055633545, -8.716022491455078, -8.515904426574707, -8.315786361694336, -8.115668296813965, -7.915550231933594, -7.715432167053223, -7.515314102172852, -7.3151960372924805, -7.115077972412109, -6.914959907531738, -6.714841842651367, -6.514723777770996, -6.314605712890625, -6.114487648010254, -5.914369583129883, -5.714251518249512, -5.514133453369141, -5.3140153884887695, -5.113897323608398, -4.913779258728027, -4.713661193847656, -4.513542652130127, -4.313424587249756, -4.113306522369385, -3.9131884574890137, -3.7130703926086426, -3.5129523277282715, -3.3128342628479004, -3.1127161979675293, -2.912598133087158, -2.712480068206787, -2.512362003326416, -2.312243938446045, -2.112125873565674, -1.9120076894760132, -1.711889624595642, -1.511771559715271, -1.3116534948349, -1.1115354299545288, -0.9114173650741577, -0.7112992405891418, -0.5111811757087708, -0.3110630512237549, -0.11094498634338379, 0.0891730785369873, 0.2892911434173584, 0.4894092082977295, 0.6895272731781006, 0.8896453976631165, 1.0897634029388428, 1.2898815870285034, 1.4899996519088745, 1.6901177167892456, 1.8902357816696167, 2.0903539657592773, 2.2904720306396484, 2.4905900955200195, 2.6907081604003906, 2.8908262252807617, 3.090944290161133, 3.291062355041504, 3.491180419921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 8.0, 9.0, 6.0, 9.0, 10.0, 9.0, 13.0, 16.0, 13.0, 30.0, 24.0, 42.0, 39.0, 37.0, 40.0, 38.0, 41.0, 52.0, 50.0, 60.0, 39.0, 43.0, 57.0, 38.0, 42.0, 40.0, 33.0, 28.0, 26.0, 20.0, 18.0, 14.0, 10.0, 6.0, 7.0, 8.0, 8.0, 7.0, 5.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.3479976654052734, -2.280540943145752, -2.2130842208862305, -2.145627498626709, -2.0781707763671875, -2.010714054107666, -1.943257451057434, -1.8758007287979126, -1.8083441257476807, -1.7408874034881592, -1.6734306812286377, -1.6059739589691162, -1.5385173559188843, -1.4710606336593628, -1.4036039113998413, -1.3361471891403198, -1.2686904668807983, -1.2012337446212769, -1.1337770223617554, -1.0663204193115234, -0.998863697052002, -0.9314069747924805, -0.863950252532959, -0.7964935302734375, -0.7290368676185608, -0.6615801453590393, -0.5941234827041626, -0.5266667604446411, -0.459210067987442, -0.3917533755302429, -0.32429665327072144, -0.25683996081352234, -0.18938326835632324, -0.12192656844854355, -0.054469868540763855, 0.012986838817596436, 0.08044353127479553, 0.14790022373199463, 0.2153569459915161, 0.2828136384487152, 0.3502703309059143, 0.4177270233631134, 0.4851837158203125, 0.552640438079834, 0.6200971603393555, 0.6875538229942322, 0.7550105452537537, 0.8224672079086304, 0.8899239301681519, 0.9573806524276733, 1.0248373746871948, 1.0922939777374268, 1.1597506999969482, 1.2272074222564697, 1.2946641445159912, 1.3621208667755127, 1.4295775890350342, 1.4970343112945557, 1.5644910335540771, 1.6319477558135986, 1.6994043588638306, 1.766861081123352, 1.8343178033828735, 1.901774525642395, 1.969231128692627]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 8.0, 18.0, 26.0, 32.0, 84.0, 138.0, 281.0, 580.0, 1493.0, 3890.0, 12242.0, 44563.0, 172722.0, 422165.0, 281007.0, 78609.0, 20694.0, 6165.0, 2159.0, 880.0, 388.0, 203.0, 84.0, 45.0, 29.0, 17.0, 8.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92626953125, -0.8815383911132812, -0.8368072509765625, -0.7920761108398438, -0.747344970703125, -0.7026138305664062, -0.6578826904296875, -0.6131515502929688, -0.56842041015625, -0.5236892700195312, -0.4789581298828125, -0.43422698974609375, -0.389495849609375, -0.34476470947265625, -0.3000335693359375, -0.25530242919921875, -0.2105712890625, -0.16584014892578125, -0.1211090087890625, -0.07637786865234375, -0.031646728515625, 0.01308441162109375, 0.0578155517578125, 0.10254669189453125, 0.14727783203125, 0.19200897216796875, 0.2367401123046875, 0.28147125244140625, 0.326202392578125, 0.37093353271484375, 0.4156646728515625, 0.46039581298828125, 0.505126953125, 0.5498580932617188, 0.5945892333984375, 0.6393203735351562, 0.684051513671875, 0.7287826538085938, 0.7735137939453125, 0.8182449340820312, 0.86297607421875, 0.9077072143554688, 0.9524383544921875, 0.9971694946289062, 1.041900634765625, 1.0866317749023438, 1.1313629150390625, 1.1760940551757812, 1.2208251953125, 1.2655563354492188, 1.3102874755859375, 1.3550186157226562, 1.399749755859375, 1.4444808959960938, 1.4892120361328125, 1.5339431762695312, 1.57867431640625, 1.6234054565429688, 1.6681365966796875, 1.7128677368164062, 1.757598876953125, 1.8023300170898438, 1.8470611572265625, 1.8917922973632812, 1.9365234375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 10.0, 9.0, 10.0, 22.0, 18.0, 16.0, 30.0, 36.0, 37.0, 39.0, 57.0, 49.0, 51.0, 62.0, 56.0, 48.0, 65.0, 54.0, 52.0, 41.0, 49.0, 38.0, 32.0, 29.0, 14.0, 14.0, 12.0, 7.0, 13.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.315673828125, -0.30750274658203125, -0.2993316650390625, -0.29116058349609375, -0.282989501953125, -0.27481842041015625, -0.2666473388671875, -0.25847625732421875, -0.25030517578125, -0.24213409423828125, -0.2339630126953125, -0.22579193115234375, -0.217620849609375, -0.20944976806640625, -0.2012786865234375, -0.19310760498046875, -0.1849365234375, -0.17676544189453125, -0.1685943603515625, -0.16042327880859375, -0.152252197265625, -0.14408111572265625, -0.1359100341796875, -0.12773895263671875, -0.11956787109375, -0.11139678955078125, -0.1032257080078125, -0.09505462646484375, -0.086883544921875, -0.07871246337890625, -0.0705413818359375, -0.06237030029296875, -0.05419921875, -0.04602813720703125, -0.0378570556640625, -0.02968597412109375, -0.021514892578125, -0.01334381103515625, -0.0051727294921875, 0.00299835205078125, 0.01116943359375, 0.01934051513671875, 0.0275115966796875, 0.03568267822265625, 0.043853759765625, 0.05202484130859375, 0.0601959228515625, 0.06836700439453125, 0.0765380859375, 0.08470916748046875, 0.0928802490234375, 0.10105133056640625, 0.109222412109375, 0.11739349365234375, 0.1255645751953125, 0.13373565673828125, 0.14190673828125, 0.15007781982421875, 0.1582489013671875, 0.16641998291015625, 0.174591064453125, 0.18276214599609375, 0.1909332275390625, 0.19910430908203125, 0.207275390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 11.0, 10.0, 23.0, 16.0, 31.0, 45.0, 78.0, 96.0, 159.0, 256.0, 402.0, 610.0, 1158.0, 2028.0, 3846.0, 7894.0, 17072.0, 39619.0, 95452.0, 218615.0, 314615.0, 196789.0, 84295.0, 35041.0, 15334.0, 7058.0, 3562.0, 1904.0, 1018.0, 544.0, 352.0, 217.0, 135.0, 66.0, 65.0, 48.0, 27.0, 16.0, 20.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.89013671875, -0.8626861572265625, -0.835235595703125, -0.8077850341796875, -0.78033447265625, -0.7528839111328125, -0.725433349609375, -0.6979827880859375, -0.6705322265625, -0.6430816650390625, -0.615631103515625, -0.5881805419921875, -0.56072998046875, -0.5332794189453125, -0.505828857421875, -0.4783782958984375, -0.450927734375, -0.4234771728515625, -0.396026611328125, -0.3685760498046875, -0.34112548828125, -0.3136749267578125, -0.286224365234375, -0.2587738037109375, -0.2313232421875, -0.2038726806640625, -0.176422119140625, -0.1489715576171875, -0.12152099609375, -0.0940704345703125, -0.066619873046875, -0.0391693115234375, -0.01171875, 0.0157318115234375, 0.043182373046875, 0.0706329345703125, 0.09808349609375, 0.1255340576171875, 0.152984619140625, 0.1804351806640625, 0.2078857421875, 0.2353363037109375, 0.262786865234375, 0.2902374267578125, 0.31768798828125, 0.3451385498046875, 0.372589111328125, 0.4000396728515625, 0.427490234375, 0.4549407958984375, 0.482391357421875, 0.5098419189453125, 0.53729248046875, 0.5647430419921875, 0.592193603515625, 0.6196441650390625, 0.6470947265625, 0.6745452880859375, 0.701995849609375, 0.7294464111328125, 0.75689697265625, 0.7843475341796875, 0.811798095703125, 0.8392486572265625, 0.86669921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 10.0, 3.0, 13.0, 11.0, 10.0, 12.0, 17.0, 21.0, 18.0, 24.0, 27.0, 19.0, 43.0, 40.0, 48.0, 60.0, 45.0, 39.0, 55.0, 48.0, 37.0, 50.0, 36.0, 41.0, 36.0, 29.0, 25.0, 32.0, 23.0, 20.0, 19.0, 15.0, 15.0, 16.0, 7.0, 10.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.2734375, -1.2375640869140625, -1.201690673828125, -1.1658172607421875, -1.12994384765625, -1.0940704345703125, -1.058197021484375, -1.0223236083984375, -0.9864501953125, -0.9505767822265625, -0.914703369140625, -0.8788299560546875, -0.84295654296875, -0.8070831298828125, -0.771209716796875, -0.7353363037109375, -0.699462890625, -0.6635894775390625, -0.627716064453125, -0.5918426513671875, -0.55596923828125, -0.5200958251953125, -0.484222412109375, -0.4483489990234375, -0.4124755859375, -0.3766021728515625, -0.340728759765625, -0.3048553466796875, -0.26898193359375, -0.2331085205078125, -0.197235107421875, -0.1613616943359375, -0.12548828125, -0.0896148681640625, -0.053741455078125, -0.0178680419921875, 0.01800537109375, 0.0538787841796875, 0.089752197265625, 0.1256256103515625, 0.1614990234375, 0.1973724365234375, 0.233245849609375, 0.2691192626953125, 0.30499267578125, 0.3408660888671875, 0.376739501953125, 0.4126129150390625, 0.448486328125, 0.4843597412109375, 0.520233154296875, 0.5561065673828125, 0.59197998046875, 0.6278533935546875, 0.663726806640625, 0.6996002197265625, 0.7354736328125, 0.7713470458984375, 0.807220458984375, 0.8430938720703125, 0.87896728515625, 0.9148406982421875, 0.950714111328125, 0.9865875244140625, 1.0224609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 14.0, 4.0, 10.0, 10.0, 19.0, 29.0, 35.0, 50.0, 78.0, 123.0, 173.0, 247.0, 447.0, 778.0, 1644.0, 3974.0, 11085.0, 39030.0, 178669.0, 519276.0, 223564.0, 47630.0, 13135.0, 4435.0, 1892.0, 877.0, 462.0, 297.0, 160.0, 115.0, 80.0, 55.0, 43.0, 29.0, 17.0, 15.0, 16.0, 8.0, 6.0, 7.0, 6.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79296875, -0.76934814453125, -0.7457275390625, -0.72210693359375, -0.698486328125, -0.67486572265625, -0.6512451171875, -0.62762451171875, -0.60400390625, -0.58038330078125, -0.5567626953125, -0.53314208984375, -0.509521484375, -0.48590087890625, -0.4622802734375, -0.43865966796875, -0.4150390625, -0.39141845703125, -0.3677978515625, -0.34417724609375, -0.320556640625, -0.29693603515625, -0.2733154296875, -0.24969482421875, -0.22607421875, -0.20245361328125, -0.1788330078125, -0.15521240234375, -0.131591796875, -0.10797119140625, -0.0843505859375, -0.06072998046875, -0.037109375, -0.01348876953125, 0.0101318359375, 0.03375244140625, 0.057373046875, 0.08099365234375, 0.1046142578125, 0.12823486328125, 0.15185546875, 0.17547607421875, 0.1990966796875, 0.22271728515625, 0.246337890625, 0.26995849609375, 0.2935791015625, 0.31719970703125, 0.3408203125, 0.36444091796875, 0.3880615234375, 0.41168212890625, 0.435302734375, 0.45892333984375, 0.4825439453125, 0.50616455078125, 0.52978515625, 0.55340576171875, 0.5770263671875, 0.60064697265625, 0.624267578125, 0.64788818359375, 0.6715087890625, 0.69512939453125, 0.71875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 9.0, 11.0, 17.0, 5.0, 24.0, 45.0, 60.0, 75.0, 98.0, 110.0, 109.0, 105.0, 79.0, 72.0, 53.0, 49.0, 26.0, 24.0, 7.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00021409988403320312, -0.0002090558409690857, -0.00020401179790496826, -0.00019896775484085083, -0.0001939237117767334, -0.00018887966871261597, -0.00018383562564849854, -0.0001787915825843811, -0.00017374753952026367, -0.00016870349645614624, -0.0001636594533920288, -0.00015861541032791138, -0.00015357136726379395, -0.00014852732419967651, -0.00014348328113555908, -0.00013843923807144165, -0.00013339519500732422, -0.0001283511519432068, -0.00012330710887908936, -0.00011826306581497192, -0.00011321902275085449, -0.00010817497968673706, -0.00010313093662261963, -9.80868935585022e-05, -9.304285049438477e-05, -8.799880743026733e-05, -8.29547643661499e-05, -7.791072130203247e-05, -7.286667823791504e-05, -6.782263517379761e-05, -6.277859210968018e-05, -5.7734549045562744e-05, -5.269050598144531e-05, -4.764646291732788e-05, -4.260241985321045e-05, -3.755837678909302e-05, -3.2514333724975586e-05, -2.7470290660858154e-05, -2.2426247596740723e-05, -1.738220453262329e-05, -1.233816146850586e-05, -7.294118404388428e-06, -2.250075340270996e-06, 2.7939677238464355e-06, 7.838010787963867e-06, 1.2882053852081299e-05, 1.792609691619873e-05, 2.2970139980316162e-05, 2.8014183044433594e-05, 3.3058226108551025e-05, 3.810226917266846e-05, 4.314631223678589e-05, 4.819035530090332e-05, 5.323439836502075e-05, 5.8278441429138184e-05, 6.332248449325562e-05, 6.836652755737305e-05, 7.341057062149048e-05, 7.845461368560791e-05, 8.349865674972534e-05, 8.854269981384277e-05, 9.35867428779602e-05, 9.863078594207764e-05, 0.00010367482900619507, 0.0001087188720703125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 10.0, 9.0, 10.0, 22.0, 22.0, 37.0, 43.0, 90.0, 108.0, 154.0, 286.0, 503.0, 925.0, 1887.0, 4525.0, 12544.0, 44087.0, 183312.0, 464469.0, 248054.0, 60320.0, 16660.0, 5696.0, 2286.0, 1068.0, 544.0, 295.0, 196.0, 126.0, 70.0, 53.0, 41.0, 28.0, 28.0, 11.0, 13.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6083984375, -0.5871353149414062, -0.5658721923828125, -0.5446090698242188, -0.523345947265625, -0.5020828247070312, -0.4808197021484375, -0.45955657958984375, -0.43829345703125, -0.41703033447265625, -0.3957672119140625, -0.37450408935546875, -0.353240966796875, -0.33197784423828125, -0.3107147216796875, -0.28945159912109375, -0.2681884765625, -0.24692535400390625, -0.2256622314453125, -0.20439910888671875, -0.183135986328125, -0.16187286376953125, -0.1406097412109375, -0.11934661865234375, -0.09808349609375, -0.07682037353515625, -0.0555572509765625, -0.03429412841796875, -0.013031005859375, 0.00823211669921875, 0.0294952392578125, 0.05075836181640625, 0.072021484375, 0.09328460693359375, 0.1145477294921875, 0.13581085205078125, 0.157073974609375, 0.17833709716796875, 0.1996002197265625, 0.22086334228515625, 0.24212646484375, 0.26338958740234375, 0.2846527099609375, 0.30591583251953125, 0.327178955078125, 0.34844207763671875, 0.3697052001953125, 0.39096832275390625, 0.4122314453125, 0.43349456787109375, 0.4547576904296875, 0.47602081298828125, 0.497283935546875, 0.5185470581054688, 0.5398101806640625, 0.5610733032226562, 0.58233642578125, 0.6035995483398438, 0.6248626708984375, 0.6461257934570312, 0.667388916015625, 0.6886520385742188, 0.7099151611328125, 0.7311782836914062, 0.75244140625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 7.0, 13.0, 11.0, 13.0, 22.0, 29.0, 22.0, 34.0, 38.0, 44.0, 68.0, 69.0, 67.0, 67.0, 69.0, 71.0, 65.0, 39.0, 45.0, 41.0, 29.0, 19.0, 10.0, 14.0, 12.0, 10.0, 7.0, 7.0, 2.0, 4.0, 7.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.74560546875, -0.7225341796875, -0.699462890625, -0.6763916015625, -0.6533203125, -0.6302490234375, -0.607177734375, -0.5841064453125, -0.56103515625, -0.5379638671875, -0.514892578125, -0.4918212890625, -0.46875, -0.4456787109375, -0.422607421875, -0.3995361328125, -0.37646484375, -0.3533935546875, -0.330322265625, -0.3072509765625, -0.2841796875, -0.2611083984375, -0.238037109375, -0.2149658203125, -0.19189453125, -0.1688232421875, -0.145751953125, -0.1226806640625, -0.099609375, -0.0765380859375, -0.053466796875, -0.0303955078125, -0.00732421875, 0.0157470703125, 0.038818359375, 0.0618896484375, 0.0849609375, 0.1080322265625, 0.131103515625, 0.1541748046875, 0.17724609375, 0.2003173828125, 0.223388671875, 0.2464599609375, 0.26953125, 0.2926025390625, 0.315673828125, 0.3387451171875, 0.36181640625, 0.3848876953125, 0.407958984375, 0.4310302734375, 0.4541015625, 0.4771728515625, 0.500244140625, 0.5233154296875, 0.54638671875, 0.5694580078125, 0.592529296875, 0.6156005859375, 0.638671875, 0.6617431640625, 0.684814453125, 0.7078857421875, 0.73095703125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 13.0, 9.0, 16.0, 21.0, 23.0, 38.0, 52.0, 58.0, 64.0, 91.0, 110.0, 95.0, 96.0, 75.0, 80.0, 45.0, 29.0, 26.0, 19.0, 13.0, 6.0, 9.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.674462795257568, -7.398504257202148, -7.12254524230957, -6.84658670425415, -6.5706281661987305, -6.2946696281433105, -6.018711090087891, -5.7427520751953125, -5.466793537139893, -5.190834999084473, -4.9148759841918945, -4.638917446136475, -4.362958908081055, -4.087000370025635, -3.8110415935516357, -3.5350828170776367, -3.259124279022217, -2.983165740966797, -2.707206964492798, -2.431248188018799, -2.155289649963379, -1.8793309926986694, -1.60337233543396, -1.3274136781692505, -1.051455020904541, -0.7754963636398315, -0.49953770637512207, -0.2235790491104126, 0.052379608154296875, 0.32833826541900635, 0.6042969226837158, 0.8802555799484253, 1.1562137603759766, 1.432172417640686, 1.7081310749053955, 1.984089732170105, 2.2600483894348145, 2.5360069274902344, 2.8119657039642334, 3.0879244804382324, 3.3638830184936523, 3.6398415565490723, 3.9158003330230713, 4.19175910949707, 4.46771764755249, 4.74367618560791, 5.019635200500488, 5.295593738555908, 5.571552276611328, 5.847510814666748, 6.123469352722168, 6.399428367614746, 6.675386905670166, 6.951345443725586, 7.227304458618164, 7.503262996673584, 7.779221534729004, 8.055180549621582, 8.331138610839844, 8.607097625732422, 8.883056640625, 9.159014701843262, 9.43497371673584, 9.710931777954102, 9.98689079284668]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 3.0, 4.0, 8.0, 13.0, 15.0, 16.0, 18.0, 28.0, 30.0, 43.0, 42.0, 33.0, 40.0, 47.0, 38.0, 52.0, 51.0, 48.0, 50.0, 51.0, 48.0, 47.0, 31.0, 24.0, 39.0, 25.0, 24.0, 19.0, 27.0, 14.0, 18.0, 16.0, 10.0, 11.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.42227029800415, -6.211087703704834, -5.999905586242676, -5.788722991943359, -5.577540397644043, -5.366357803344727, -5.155175685882568, -4.943993091583252, -4.7328104972839355, -4.521627902984619, -4.310445785522461, -4.0992631912231445, -3.888080596923828, -3.676898241043091, -3.4657158851623535, -3.254533290863037, -3.0433509349823, -2.8321685791015625, -2.620985984802246, -2.409803628921509, -2.1986210346221924, -1.987438678741455, -1.7762562036514282, -1.5650737285614014, -1.3538912534713745, -1.1427087783813477, -0.9315263032913208, -0.7203438878059387, -0.5091614127159119, -0.2979789972305298, -0.08679652214050293, 0.12438595294952393, 0.3355684280395508, 0.5467509031295776, 0.7579333782196045, 0.9691157937049866, 1.1802983283996582, 1.3914806842803955, 1.6026631593704224, 1.8138456344604492, 2.0250282287597656, 2.236210584640503, 2.4473931789398193, 2.6585755348205566, 2.869758129119873, 3.0809404850006104, 3.2921228408813477, 3.503305435180664, 3.7144877910614014, 3.9256701469421387, 4.136852741241455, 4.3480353355407715, 4.55921745300293, 4.770400047302246, 4.9815826416015625, 5.192765235900879, 5.403947353363037, 5.6151299476623535, 5.826312065124512, 6.037494659423828, 6.2486772537231445, 6.459859848022461, 6.671041965484619, 6.8822245597839355, 7.093407154083252]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 1.0, 8.0, 6.0, 16.0, 14.0, 30.0, 31.0, 64.0, 86.0, 107.0, 212.0, 317.0, 636.0, 1266.0, 2709.0, 6774.0, 21637.0, 188841.0, 3914834.0, 39646.0, 9733.0, 3685.0, 1679.0, 843.0, 443.0, 246.0, 139.0, 89.0, 67.0, 46.0, 19.0, 11.0, 13.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7841796875, -1.726959228515625, -1.66973876953125, -1.612518310546875, -1.5552978515625, -1.498077392578125, -1.44085693359375, -1.383636474609375, -1.326416015625, -1.269195556640625, -1.21197509765625, -1.154754638671875, -1.0975341796875, -1.040313720703125, -0.98309326171875, -0.925872802734375, -0.86865234375, -0.811431884765625, -0.75421142578125, -0.696990966796875, -0.6397705078125, -0.582550048828125, -0.52532958984375, -0.468109130859375, -0.410888671875, -0.353668212890625, -0.29644775390625, -0.239227294921875, -0.1820068359375, -0.124786376953125, -0.06756591796875, -0.010345458984375, 0.046875, 0.104095458984375, 0.16131591796875, 0.218536376953125, 0.2757568359375, 0.332977294921875, 0.39019775390625, 0.447418212890625, 0.504638671875, 0.561859130859375, 0.61907958984375, 0.676300048828125, 0.7335205078125, 0.790740966796875, 0.84796142578125, 0.905181884765625, 0.96240234375, 1.019622802734375, 1.07684326171875, 1.134063720703125, 1.1912841796875, 1.248504638671875, 1.30572509765625, 1.362945556640625, 1.420166015625, 1.477386474609375, 1.53460693359375, 1.591827392578125, 1.6490478515625, 1.706268310546875, 1.76348876953125, 1.820709228515625, 1.8779296875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 7.0, 11.0, 19.0, 25.0, 19.0, 20.0, 37.0, 43.0, 33.0, 43.0, 51.0, 57.0, 45.0, 58.0, 62.0, 58.0, 48.0, 43.0, 64.0, 37.0, 34.0, 32.0, 28.0, 21.0, 19.0, 10.0, 17.0, 19.0, 7.0, 2.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3671875, -0.3572845458984375, -0.347381591796875, -0.3374786376953125, -0.32757568359375, -0.3176727294921875, -0.307769775390625, -0.2978668212890625, -0.2879638671875, -0.2780609130859375, -0.268157958984375, -0.2582550048828125, -0.24835205078125, -0.2384490966796875, -0.228546142578125, -0.2186431884765625, -0.208740234375, -0.1988372802734375, -0.188934326171875, -0.1790313720703125, -0.16912841796875, -0.1592254638671875, -0.149322509765625, -0.1394195556640625, -0.1295166015625, -0.1196136474609375, -0.109710693359375, -0.0998077392578125, -0.08990478515625, -0.0800018310546875, -0.070098876953125, -0.0601959228515625, -0.05029296875, -0.0403900146484375, -0.030487060546875, -0.0205841064453125, -0.01068115234375, -0.0007781982421875, 0.009124755859375, 0.0190277099609375, 0.0289306640625, 0.0388336181640625, 0.048736572265625, 0.0586395263671875, 0.06854248046875, 0.0784454345703125, 0.088348388671875, 0.0982513427734375, 0.108154296875, 0.1180572509765625, 0.127960205078125, 0.1378631591796875, 0.14776611328125, 0.1576690673828125, 0.167572021484375, 0.1774749755859375, 0.1873779296875, 0.1972808837890625, 0.207183837890625, 0.2170867919921875, 0.22698974609375, 0.2368927001953125, 0.246795654296875, 0.2566986083984375, 0.2666015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 6.0, 6.0, 8.0, 20.0, 20.0, 30.0, 49.0, 68.0, 86.0, 137.0, 201.0, 347.0, 453.0, 735.0, 1262.0, 2322.0, 4892.0, 12614.0, 51828.0, 3923668.0, 158905.0, 22028.0, 7153.0, 3198.0, 1563.0, 960.0, 606.0, 339.0, 241.0, 167.0, 129.0, 76.0, 43.0, 35.0, 28.0, 13.0, 9.0, 9.0, 8.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.626953125, -2.549072265625, -2.47119140625, -2.393310546875, -2.3154296875, -2.237548828125, -2.15966796875, -2.081787109375, -2.00390625, -1.926025390625, -1.84814453125, -1.770263671875, -1.6923828125, -1.614501953125, -1.53662109375, -1.458740234375, -1.380859375, -1.302978515625, -1.22509765625, -1.147216796875, -1.0693359375, -0.991455078125, -0.91357421875, -0.835693359375, -0.7578125, -0.679931640625, -0.60205078125, -0.524169921875, -0.4462890625, -0.368408203125, -0.29052734375, -0.212646484375, -0.134765625, -0.056884765625, 0.02099609375, 0.098876953125, 0.1767578125, 0.254638671875, 0.33251953125, 0.410400390625, 0.48828125, 0.566162109375, 0.64404296875, 0.721923828125, 0.7998046875, 0.877685546875, 0.95556640625, 1.033447265625, 1.111328125, 1.189208984375, 1.26708984375, 1.344970703125, 1.4228515625, 1.500732421875, 1.57861328125, 1.656494140625, 1.734375, 1.812255859375, 1.89013671875, 1.968017578125, 2.0458984375, 2.123779296875, 2.20166015625, 2.279541015625, 2.357421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 2.0, 5.0, 17.0, 25.0, 21.0, 58.0, 196.0, 3425.0, 193.0, 50.0, 28.0, 12.0, 9.0, 6.0, 5.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6943359375, -0.6729583740234375, -0.651580810546875, -0.6302032470703125, -0.60882568359375, -0.5874481201171875, -0.566070556640625, -0.5446929931640625, -0.5233154296875, -0.5019378662109375, -0.480560302734375, -0.4591827392578125, -0.43780517578125, -0.4164276123046875, -0.395050048828125, -0.3736724853515625, -0.352294921875, -0.3309173583984375, -0.309539794921875, -0.2881622314453125, -0.26678466796875, -0.2454071044921875, -0.224029541015625, -0.2026519775390625, -0.1812744140625, -0.1598968505859375, -0.138519287109375, -0.1171417236328125, -0.09576416015625, -0.0743865966796875, -0.053009033203125, -0.0316314697265625, -0.01025390625, 0.0111236572265625, 0.032501220703125, 0.0538787841796875, 0.07525634765625, 0.0966339111328125, 0.118011474609375, 0.1393890380859375, 0.1607666015625, 0.1821441650390625, 0.203521728515625, 0.2248992919921875, 0.24627685546875, 0.2676544189453125, 0.289031982421875, 0.3104095458984375, 0.331787109375, 0.3531646728515625, 0.374542236328125, 0.3959197998046875, 0.41729736328125, 0.4386749267578125, 0.460052490234375, 0.4814300537109375, 0.5028076171875, 0.5241851806640625, 0.545562744140625, 0.5669403076171875, 0.58831787109375, 0.6096954345703125, 0.631072998046875, 0.6524505615234375, 0.673828125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 11.0, 30.0, 36.0, 76.0, 156.0, 237.0, 205.0, 133.0, 66.0, 32.0, 13.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.628856658935547, -5.503933906555176, -5.379011631011963, -5.254088878631592, -5.129166603088379, -5.004243850708008, -4.879321575164795, -4.754398822784424, -4.629476547241211, -4.50455379486084, -4.379631519317627, -4.254708766937256, -4.129786491394043, -4.004863739013672, -3.87994122505188, -3.755018711090088, -3.630095958709717, -3.505173444747925, -3.380250930786133, -3.255328416824341, -3.130405902862549, -3.0054831504821777, -2.8805606365203857, -2.7556381225585938, -2.6307156085968018, -2.5057930946350098, -2.3808705806732178, -2.255948066711426, -2.1310253143310547, -2.006103038787842, -1.8811802864074707, -1.7562577724456787, -1.6313354969024658, -1.5064129829406738, -1.3814904689788818, -1.2565678358078003, -1.1316453218460083, -1.0067228078842163, -0.8818002343177795, -0.7568776607513428, -0.6319551467895508, -0.5070326328277588, -0.382110059261322, -0.25718751549720764, -0.13226497173309326, -0.0073424577713012695, 0.1175801157951355, 0.24250268936157227, 0.36742520332336426, 0.49234774708747864, 0.617270290851593, 0.7421928644180298, 0.8671153783798218, 0.9920378923416138, 1.1169605255126953, 1.2418830394744873, 1.3668055534362793, 1.4917280673980713, 1.6166505813598633, 1.7415732145309448, 1.8664957284927368, 1.9914182424545288, 2.1163408756256104, 2.2412633895874023, 2.3661859035491943]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 0.0, 5.0, 15.0, 8.0, 13.0, 17.0, 26.0, 18.0, 22.0, 46.0, 35.0, 31.0, 38.0, 41.0, 58.0, 36.0, 44.0, 59.0, 42.0, 44.0, 49.0, 45.0, 34.0, 41.0, 33.0, 34.0, 26.0, 28.0, 17.0, 26.0, 10.0, 11.0, 10.0, 12.0, 9.0, 10.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.464925765991211, -1.4220956563949585, -1.379265546798706, -1.3364355564117432, -1.2936054468154907, -1.2507753372192383, -1.2079452276229858, -1.1651151180267334, -1.1222851276397705, -1.079455018043518, -1.0366249084472656, -0.993794858455658, -0.9509648084640503, -0.9081346988677979, -0.8653045892715454, -0.822474479675293, -0.7796443700790405, -0.7368142604827881, -0.6939842104911804, -0.651154100894928, -0.6083240509033203, -0.5654939413070679, -0.5226638317108154, -0.4798337519168854, -0.4370036721229553, -0.39417359232902527, -0.3513435125350952, -0.3085134029388428, -0.2656833231449127, -0.22285324335098267, -0.18002313375473022, -0.13719305396080017, -0.09436297416687012, -0.05153288692235947, -0.008702799677848816, 0.03412729501724243, 0.07695737481117249, 0.11978745460510254, 0.16261756420135498, 0.20544764399528503, 0.2482777237892151, 0.29110780358314514, 0.3339378833770752, 0.37676799297332764, 0.4195980727672577, 0.46242815256118774, 0.5052582621574402, 0.5480883121490479, 0.5909184217453003, 0.6337485313415527, 0.6765785813331604, 0.7194086909294128, 0.7622387409210205, 0.805068850517273, 0.8478989601135254, 0.8907290697097778, 0.9335591197013855, 0.9763892292976379, 1.0192192792892456, 1.062049388885498, 1.1048794984817505, 1.147709608078003, 1.1905395984649658, 1.2333697080612183, 1.2761998176574707]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 6.0, 5.0, 3.0, 12.0, 14.0, 30.0, 52.0, 80.0, 157.0, 281.0, 454.0, 918.0, 1787.0, 3550.0, 7353.0, 15511.0, 33989.0, 73958.0, 148639.0, 240609.0, 238310.0, 147201.0, 72405.0, 33504.0, 15392.0, 7129.0, 3550.0, 1717.0, 869.0, 457.0, 259.0, 151.0, 91.0, 44.0, 30.0, 23.0, 13.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.173828125, -1.13824462890625, -1.1026611328125, -1.06707763671875, -1.031494140625, -0.99591064453125, -0.9603271484375, -0.92474365234375, -0.88916015625, -0.85357666015625, -0.8179931640625, -0.78240966796875, -0.746826171875, -0.71124267578125, -0.6756591796875, -0.64007568359375, -0.6044921875, -0.56890869140625, -0.5333251953125, -0.49774169921875, -0.462158203125, -0.42657470703125, -0.3909912109375, -0.35540771484375, -0.31982421875, -0.28424072265625, -0.2486572265625, -0.21307373046875, -0.177490234375, -0.14190673828125, -0.1063232421875, -0.07073974609375, -0.03515625, 0.00042724609375, 0.0360107421875, 0.07159423828125, 0.107177734375, 0.14276123046875, 0.1783447265625, 0.21392822265625, 0.24951171875, 0.28509521484375, 0.3206787109375, 0.35626220703125, 0.391845703125, 0.42742919921875, 0.4630126953125, 0.49859619140625, 0.5341796875, 0.56976318359375, 0.6053466796875, 0.64093017578125, 0.676513671875, 0.71209716796875, 0.7476806640625, 0.78326416015625, 0.81884765625, 0.85443115234375, 0.8900146484375, 0.92559814453125, 0.961181640625, 0.99676513671875, 1.0323486328125, 1.06793212890625, 1.103515625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 12.0, 11.0, 14.0, 17.0, 10.0, 27.0, 19.0, 31.0, 32.0, 29.0, 32.0, 49.0, 43.0, 50.0, 41.0, 58.0, 56.0, 52.0, 54.0, 49.0, 45.0, 42.0, 36.0, 27.0, 31.0, 21.0, 24.0, 17.0, 11.0, 13.0, 8.0, 10.0, 6.0, 4.0, 5.0, 5.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4580078125, -0.4446563720703125, -0.431304931640625, -0.4179534912109375, -0.40460205078125, -0.3912506103515625, -0.377899169921875, -0.3645477294921875, -0.3511962890625, -0.3378448486328125, -0.324493408203125, -0.3111419677734375, -0.29779052734375, -0.2844390869140625, -0.271087646484375, -0.2577362060546875, -0.244384765625, -0.2310333251953125, -0.217681884765625, -0.2043304443359375, -0.19097900390625, -0.1776275634765625, -0.164276123046875, -0.1509246826171875, -0.1375732421875, -0.1242218017578125, -0.110870361328125, -0.0975189208984375, -0.08416748046875, -0.0708160400390625, -0.057464599609375, -0.0441131591796875, -0.03076171875, -0.0174102783203125, -0.004058837890625, 0.0092926025390625, 0.02264404296875, 0.0359954833984375, 0.049346923828125, 0.0626983642578125, 0.0760498046875, 0.0894012451171875, 0.102752685546875, 0.1161041259765625, 0.12945556640625, 0.1428070068359375, 0.156158447265625, 0.1695098876953125, 0.182861328125, 0.1962127685546875, 0.209564208984375, 0.2229156494140625, 0.23626708984375, 0.2496185302734375, 0.262969970703125, 0.2763214111328125, 0.2896728515625, 0.3030242919921875, 0.316375732421875, 0.3297271728515625, 0.34307861328125, 0.3564300537109375, 0.369781494140625, 0.3831329345703125, 0.396484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 11.0, 15.0, 18.0, 13.0, 38.0, 42.0, 63.0, 108.0, 191.0, 284.0, 478.0, 799.0, 1413.0, 2912.0, 5714.0, 11717.0, 25127.0, 57290.0, 130340.0, 266453.0, 286366.0, 142855.0, 62615.0, 27816.0, 12799.0, 6214.0, 3078.0, 1620.0, 882.0, 472.0, 305.0, 178.0, 88.0, 71.0, 52.0, 32.0, 23.0, 15.0, 9.0, 6.0, 10.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.184234619140625, -1.14483642578125, -1.105438232421875, -1.0660400390625, -1.026641845703125, -0.98724365234375, -0.947845458984375, -0.908447265625, -0.869049072265625, -0.82965087890625, -0.790252685546875, -0.7508544921875, -0.711456298828125, -0.67205810546875, -0.632659912109375, -0.59326171875, -0.553863525390625, -0.51446533203125, -0.475067138671875, -0.4356689453125, -0.396270751953125, -0.35687255859375, -0.317474365234375, -0.278076171875, -0.238677978515625, -0.19927978515625, -0.159881591796875, -0.1204833984375, -0.081085205078125, -0.04168701171875, -0.002288818359375, 0.037109375, 0.076507568359375, 0.11590576171875, 0.155303955078125, 0.1947021484375, 0.234100341796875, 0.27349853515625, 0.312896728515625, 0.352294921875, 0.391693115234375, 0.43109130859375, 0.470489501953125, 0.5098876953125, 0.549285888671875, 0.58868408203125, 0.628082275390625, 0.66748046875, 0.706878662109375, 0.74627685546875, 0.785675048828125, 0.8250732421875, 0.864471435546875, 0.90386962890625, 0.943267822265625, 0.982666015625, 1.022064208984375, 1.06146240234375, 1.100860595703125, 1.1402587890625, 1.179656982421875, 1.21905517578125, 1.258453369140625, 1.2978515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 8.0, 3.0, 11.0, 7.0, 11.0, 19.0, 17.0, 22.0, 12.0, 21.0, 24.0, 26.0, 26.0, 20.0, 41.0, 35.0, 32.0, 38.0, 44.0, 45.0, 38.0, 53.0, 29.0, 39.0, 53.0, 38.0, 29.0, 28.0, 32.0, 36.0, 25.0, 25.0, 21.0, 13.0, 16.0, 7.0, 16.0, 7.0, 8.0, 5.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2109375, -2.1473541259765625, -2.083770751953125, -2.0201873779296875, -1.95660400390625, -1.8930206298828125, -1.829437255859375, -1.7658538818359375, -1.7022705078125, -1.6386871337890625, -1.575103759765625, -1.5115203857421875, -1.44793701171875, -1.3843536376953125, -1.320770263671875, -1.2571868896484375, -1.193603515625, -1.1300201416015625, -1.066436767578125, -1.0028533935546875, -0.93927001953125, -0.8756866455078125, -0.812103271484375, -0.7485198974609375, -0.6849365234375, -0.6213531494140625, -0.557769775390625, -0.4941864013671875, -0.43060302734375, -0.3670196533203125, -0.303436279296875, -0.2398529052734375, -0.17626953125, -0.1126861572265625, -0.049102783203125, 0.0144805908203125, 0.07806396484375, 0.1416473388671875, 0.205230712890625, 0.2688140869140625, 0.3323974609375, 0.3959808349609375, 0.459564208984375, 0.5231475830078125, 0.58673095703125, 0.6503143310546875, 0.713897705078125, 0.7774810791015625, 0.841064453125, 0.9046478271484375, 0.968231201171875, 1.0318145751953125, 1.09539794921875, 1.1589813232421875, 1.222564697265625, 1.2861480712890625, 1.3497314453125, 1.4133148193359375, 1.476898193359375, 1.5404815673828125, 1.60406494140625, 1.6676483154296875, 1.731231689453125, 1.7948150634765625, 1.8583984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 5.0, 13.0, 20.0, 30.0, 35.0, 71.0, 94.0, 182.0, 320.0, 698.0, 1730.0, 6211.0, 44758.0, 846406.0, 133174.0, 10307.0, 2667.0, 880.0, 408.0, 218.0, 116.0, 72.0, 49.0, 34.0, 16.0, 9.0, 12.0, 3.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.42156982421875, -2.3450927734375, -2.26861572265625, -2.192138671875, -2.11566162109375, -2.0391845703125, -1.96270751953125, -1.88623046875, -1.80975341796875, -1.7332763671875, -1.65679931640625, -1.580322265625, -1.50384521484375, -1.4273681640625, -1.35089111328125, -1.2744140625, -1.19793701171875, -1.1214599609375, -1.04498291015625, -0.968505859375, -0.89202880859375, -0.8155517578125, -0.73907470703125, -0.66259765625, -0.58612060546875, -0.5096435546875, -0.43316650390625, -0.356689453125, -0.28021240234375, -0.2037353515625, -0.12725830078125, -0.05078125, 0.02569580078125, 0.1021728515625, 0.17864990234375, 0.255126953125, 0.33160400390625, 0.4080810546875, 0.48455810546875, 0.56103515625, 0.63751220703125, 0.7139892578125, 0.79046630859375, 0.866943359375, 0.94342041015625, 1.0198974609375, 1.09637451171875, 1.1728515625, 1.24932861328125, 1.3258056640625, 1.40228271484375, 1.478759765625, 1.55523681640625, 1.6317138671875, 1.70819091796875, 1.78466796875, 1.86114501953125, 1.9376220703125, 2.01409912109375, 2.090576171875, 2.16705322265625, 2.2435302734375, 2.32000732421875, 2.396484375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 4.0, 12.0, 14.0, 14.0, 25.0, 27.0, 22.0, 39.0, 35.0, 54.0, 74.0, 60.0, 73.0, 70.0, 66.0, 70.0, 55.0, 46.0, 52.0, 33.0, 32.0, 15.0, 21.0, 16.0, 16.0, 8.0, 4.0, 5.0, 5.0, 5.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015234947204589844, -0.00014814548194408417, -0.0001439414918422699, -0.00013973750174045563, -0.00013553351163864136, -0.0001313295215368271, -0.00012712553143501282, -0.00012292154133319855, -0.00011871755123138428, -0.00011451356112957001, -0.00011030957102775574, -0.00010610558092594147, -0.0001019015908241272, -9.769760072231293e-05, -9.349361062049866e-05, -8.928962051868439e-05, -8.508563041687012e-05, -8.088164031505585e-05, -7.667765021324158e-05, -7.247366011142731e-05, -6.826967000961304e-05, -6.406567990779877e-05, -5.98616898059845e-05, -5.565769970417023e-05, -5.145370960235596e-05, -4.724971950054169e-05, -4.304572939872742e-05, -3.884173929691315e-05, -3.463774919509888e-05, -3.0433759093284607e-05, -2.6229768991470337e-05, -2.2025778889656067e-05, -1.7821788787841797e-05, -1.3617798686027527e-05, -9.413808584213257e-06, -5.209818482398987e-06, -1.0058283805847168e-06, 3.1981617212295532e-06, 7.402151823043823e-06, 1.1606141924858093e-05, 1.5810132026672363e-05, 2.0014122128486633e-05, 2.4218112230300903e-05, 2.8422102332115173e-05, 3.262609243392944e-05, 3.683008253574371e-05, 4.1034072637557983e-05, 4.5238062739372253e-05, 4.9442052841186523e-05, 5.3646042943000793e-05, 5.7850033044815063e-05, 6.205402314662933e-05, 6.62580132484436e-05, 7.046200335025787e-05, 7.466599345207214e-05, 7.886998355388641e-05, 8.307397365570068e-05, 8.727796375751495e-05, 9.148195385932922e-05, 9.56859439611435e-05, 9.988993406295776e-05, 0.00010409392416477203, 0.0001082979142665863, 0.00011250190436840057, 0.00011670589447021484]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 7.0, 10.0, 18.0, 36.0, 51.0, 79.0, 149.0, 335.0, 774.0, 1951.0, 6735.0, 40812.0, 496534.0, 453748.0, 37717.0, 6274.0, 1904.0, 692.0, 353.0, 149.0, 62.0, 60.0, 31.0, 10.0, 11.0, 7.0, 11.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.6357421875, -1.5845947265625, -1.533447265625, -1.4822998046875, -1.43115234375, -1.3800048828125, -1.328857421875, -1.2777099609375, -1.2265625, -1.1754150390625, -1.124267578125, -1.0731201171875, -1.02197265625, -0.9708251953125, -0.919677734375, -0.8685302734375, -0.8173828125, -0.7662353515625, -0.715087890625, -0.6639404296875, -0.61279296875, -0.5616455078125, -0.510498046875, -0.4593505859375, -0.408203125, -0.3570556640625, -0.305908203125, -0.2547607421875, -0.20361328125, -0.1524658203125, -0.101318359375, -0.0501708984375, 0.0009765625, 0.0521240234375, 0.103271484375, 0.1544189453125, 0.20556640625, 0.2567138671875, 0.307861328125, 0.3590087890625, 0.41015625, 0.4613037109375, 0.512451171875, 0.5635986328125, 0.61474609375, 0.6658935546875, 0.717041015625, 0.7681884765625, 0.8193359375, 0.8704833984375, 0.921630859375, 0.9727783203125, 1.02392578125, 1.0750732421875, 1.126220703125, 1.1773681640625, 1.228515625, 1.2796630859375, 1.330810546875, 1.3819580078125, 1.43310546875, 1.4842529296875, 1.535400390625, 1.5865478515625, 1.6376953125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 7.0, 7.0, 17.0, 22.0, 18.0, 41.0, 55.0, 79.0, 120.0, 157.0, 119.0, 109.0, 69.0, 50.0, 46.0, 22.0, 23.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.248046875, -2.183563232421875, -2.11907958984375, -2.054595947265625, -1.9901123046875, -1.925628662109375, -1.86114501953125, -1.796661376953125, -1.732177734375, -1.667694091796875, -1.60321044921875, -1.538726806640625, -1.4742431640625, -1.409759521484375, -1.34527587890625, -1.280792236328125, -1.21630859375, -1.151824951171875, -1.08734130859375, -1.022857666015625, -0.9583740234375, -0.893890380859375, -0.82940673828125, -0.764923095703125, -0.700439453125, -0.635955810546875, -0.57147216796875, -0.506988525390625, -0.4425048828125, -0.378021240234375, -0.31353759765625, -0.249053955078125, -0.1845703125, -0.120086669921875, -0.05560302734375, 0.008880615234375, 0.0733642578125, 0.137847900390625, 0.20233154296875, 0.266815185546875, 0.331298828125, 0.395782470703125, 0.46026611328125, 0.524749755859375, 0.5892333984375, 0.653717041015625, 0.71820068359375, 0.782684326171875, 0.84716796875, 0.911651611328125, 0.97613525390625, 1.040618896484375, 1.1051025390625, 1.169586181640625, 1.23406982421875, 1.298553466796875, 1.363037109375, 1.427520751953125, 1.49200439453125, 1.556488037109375, 1.6209716796875, 1.685455322265625, 1.74993896484375, 1.814422607421875, 1.87890625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 12.0, 28.0, 81.0, 177.0, 293.0, 234.0, 147.0, 33.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.814849853515625, -60.18119812011719, -58.54754638671875, -56.91389083862305, -55.28023910522461, -53.64658737182617, -52.012935638427734, -50.37928009033203, -48.745628356933594, -47.111976623535156, -45.47832489013672, -43.844669342041016, -42.21101760864258, -40.57736587524414, -38.9437141418457, -37.31005859375, -35.67640686035156, -34.042755126953125, -32.40910339355469, -30.775449752807617, -29.141796112060547, -27.50814437866211, -25.874492645263672, -24.2408390045166, -22.607189178466797, -20.97353744506836, -19.33988380432129, -17.70623207092285, -16.07257843017578, -14.438926696777344, -12.80527400970459, -11.171621322631836, -9.537967681884766, -7.904314994812012, -6.270662307739258, -4.637010097503662, -3.003357410430908, -1.3697052001953125, 0.2639474868774414, 1.8976001739501953, 3.531252861022949, 5.164905548095703, 6.798558235168457, 8.432210922241211, 10.065862655639648, 11.699515342712402, 13.333168029785156, 14.96682071685791, 16.600473403930664, 18.2341251373291, 19.867778778076172, 21.50143051147461, 23.13508415222168, 24.768735885620117, 26.402389526367188, 28.036041259765625, 29.669692993164062, 31.3033447265625, 32.93699645996094, 34.57065200805664, 36.20430374145508, 37.837955474853516, 39.47160720825195, 41.105262756347656, 42.738914489746094]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 6.0, 10.0, 17.0, 7.0, 17.0, 19.0, 22.0, 20.0, 31.0, 34.0, 54.0, 46.0, 26.0, 41.0, 51.0, 38.0, 52.0, 51.0, 43.0, 42.0, 45.0, 51.0, 54.0, 28.0, 30.0, 32.0, 25.0, 24.0, 22.0, 11.0, 15.0, 5.0, 5.0, 8.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.628750801086426, -14.241868019104004, -13.854984283447266, -13.468101501464844, -13.081217765808105, -12.694334983825684, -12.307451248168945, -11.920568466186523, -11.533685684204102, -11.14680290222168, -10.759919166564941, -10.37303638458252, -9.986152648925781, -9.59926986694336, -9.212387084960938, -8.8255033493042, -8.438619613647461, -8.051736831665039, -7.664853096008301, -7.277970314025879, -6.891086578369141, -6.504203796386719, -6.117320537567139, -5.730437278747559, -5.3435540199279785, -4.956670761108398, -4.569787502288818, -4.182904243469238, -3.7960212230682373, -3.4091379642486572, -3.0222549438476562, -2.635371685028076, -2.2484893798828125, -1.8616061210632324, -1.474722981452942, -1.0878398418426514, -0.7009565830230713, -0.3140733242034912, 0.07280969619750977, 0.45969295501708984, 0.8465762138366699, 1.23345947265625, 1.6203426122665405, 2.007225751876831, 2.394109010696411, 2.780992269515991, 3.167875289916992, 3.5547585487365723, 3.9416418075561523, 4.328525066375732, 4.7154083251953125, 5.102291107177734, 5.489174842834473, 5.8760576248168945, 6.262940883636475, 6.649824142456055, 7.036707401275635, 7.423590660095215, 7.810473918914795, 8.197357177734375, 8.584239959716797, 8.971123695373535, 9.358006477355957, 9.744890213012695, 10.131772994995117]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 3.0, 5.0, 6.0, 13.0, 20.0, 32.0, 28.0, 50.0, 61.0, 100.0, 149.0, 255.0, 503.0, 845.0, 1897.0, 4820.0, 15880.0, 102168.0, 3993789.0, 55338.0, 11278.0, 3625.0, 1527.0, 798.0, 393.0, 230.0, 179.0, 97.0, 59.0, 39.0, 23.0, 14.0, 18.0, 14.0, 4.0, 9.0, 3.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.744140625, -2.65936279296875, -2.5745849609375, -2.48980712890625, -2.405029296875, -2.32025146484375, -2.2354736328125, -2.15069580078125, -2.06591796875, -1.98114013671875, -1.8963623046875, -1.81158447265625, -1.726806640625, -1.64202880859375, -1.5572509765625, -1.47247314453125, -1.3876953125, -1.30291748046875, -1.2181396484375, -1.13336181640625, -1.048583984375, -0.96380615234375, -0.8790283203125, -0.79425048828125, -0.70947265625, -0.62469482421875, -0.5399169921875, -0.45513916015625, -0.370361328125, -0.28558349609375, -0.2008056640625, -0.11602783203125, -0.03125, 0.05352783203125, 0.1383056640625, 0.22308349609375, 0.307861328125, 0.39263916015625, 0.4774169921875, 0.56219482421875, 0.64697265625, 0.73175048828125, 0.8165283203125, 0.90130615234375, 0.986083984375, 1.07086181640625, 1.1556396484375, 1.24041748046875, 1.3251953125, 1.40997314453125, 1.4947509765625, 1.57952880859375, 1.664306640625, 1.74908447265625, 1.8338623046875, 1.91864013671875, 2.00341796875, 2.08819580078125, 2.1729736328125, 2.25775146484375, 2.342529296875, 2.42730712890625, 2.5120849609375, 2.59686279296875, 2.681640625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 10.0, 11.0, 6.0, 11.0, 17.0, 26.0, 26.0, 22.0, 32.0, 35.0, 45.0, 44.0, 58.0, 66.0, 51.0, 49.0, 66.0, 62.0, 64.0, 35.0, 41.0, 36.0, 30.0, 33.0, 18.0, 16.0, 21.0, 18.0, 12.0, 9.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46240234375, -0.44673919677734375, -0.4310760498046875, -0.41541290283203125, -0.399749755859375, -0.38408660888671875, -0.3684234619140625, -0.35276031494140625, -0.33709716796875, -0.32143402099609375, -0.3057708740234375, -0.29010772705078125, -0.274444580078125, -0.25878143310546875, -0.2431182861328125, -0.22745513916015625, -0.2117919921875, -0.19612884521484375, -0.1804656982421875, -0.16480255126953125, -0.149139404296875, -0.13347625732421875, -0.1178131103515625, -0.10214996337890625, -0.08648681640625, -0.07082366943359375, -0.0551605224609375, -0.03949737548828125, -0.023834228515625, -0.00817108154296875, 0.0074920654296875, 0.02315521240234375, 0.038818359375, 0.05448150634765625, 0.0701446533203125, 0.08580780029296875, 0.101470947265625, 0.11713409423828125, 0.1327972412109375, 0.14846038818359375, 0.16412353515625, 0.17978668212890625, 0.1954498291015625, 0.21111297607421875, 0.226776123046875, 0.24243927001953125, 0.2581024169921875, 0.27376556396484375, 0.2894287109375, 0.30509185791015625, 0.3207550048828125, 0.33641815185546875, 0.352081298828125, 0.36774444580078125, 0.3834075927734375, 0.39907073974609375, 0.41473388671875, 0.43039703369140625, 0.4460601806640625, 0.46172332763671875, 0.477386474609375, 0.49304962158203125, 0.5087127685546875, 0.5243759155273438, 0.5400390625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 10.0, 5.0, 18.0, 8.0, 14.0, 25.0, 31.0, 38.0, 55.0, 66.0, 95.0, 134.0, 198.0, 288.0, 428.0, 705.0, 1123.0, 1935.0, 3619.0, 7237.0, 17678.0, 59039.0, 3501558.0, 518785.0, 50630.0, 15843.0, 6726.0, 3208.0, 1764.0, 977.0, 626.0, 417.0, 270.0, 201.0, 140.0, 103.0, 68.0, 59.0, 36.0, 24.0, 19.0, 15.0, 16.0, 11.0, 12.0, 7.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-2.796875, -2.71197509765625, -2.6270751953125, -2.54217529296875, -2.457275390625, -2.37237548828125, -2.2874755859375, -2.20257568359375, -2.11767578125, -2.03277587890625, -1.9478759765625, -1.86297607421875, -1.778076171875, -1.69317626953125, -1.6082763671875, -1.52337646484375, -1.4384765625, -1.35357666015625, -1.2686767578125, -1.18377685546875, -1.098876953125, -1.01397705078125, -0.9290771484375, -0.84417724609375, -0.75927734375, -0.67437744140625, -0.5894775390625, -0.50457763671875, -0.419677734375, -0.33477783203125, -0.2498779296875, -0.16497802734375, -0.080078125, 0.00482177734375, 0.0897216796875, 0.17462158203125, 0.259521484375, 0.34442138671875, 0.4293212890625, 0.51422119140625, 0.59912109375, 0.68402099609375, 0.7689208984375, 0.85382080078125, 0.938720703125, 1.02362060546875, 1.1085205078125, 1.19342041015625, 1.2783203125, 1.36322021484375, 1.4481201171875, 1.53302001953125, 1.617919921875, 1.70281982421875, 1.7877197265625, 1.87261962890625, 1.95751953125, 2.04241943359375, 2.1273193359375, 2.21221923828125, 2.297119140625, 2.38201904296875, 2.4669189453125, 2.55181884765625, 2.63671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 1.0, 4.0, 10.0, 9.0, 19.0, 24.0, 59.0, 132.0, 2568.0, 968.0, 118.0, 58.0, 31.0, 22.0, 16.0, 11.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.4227371215820312, -1.3903961181640625, -1.3580551147460938, -1.325714111328125, -1.2933731079101562, -1.2610321044921875, -1.2286911010742188, -1.19635009765625, -1.1640090942382812, -1.1316680908203125, -1.0993270874023438, -1.066986083984375, -1.0346450805664062, -1.0023040771484375, -0.9699630737304688, -0.9376220703125, -0.9052810668945312, -0.8729400634765625, -0.8405990600585938, -0.808258056640625, -0.7759170532226562, -0.7435760498046875, -0.7112350463867188, -0.67889404296875, -0.6465530395507812, -0.6142120361328125, -0.5818710327148438, -0.549530029296875, -0.5171890258789062, -0.4848480224609375, -0.45250701904296875, -0.420166015625, -0.38782501220703125, -0.3554840087890625, -0.32314300537109375, -0.290802001953125, -0.25846099853515625, -0.2261199951171875, -0.19377899169921875, -0.16143798828125, -0.12909698486328125, -0.0967559814453125, -0.06441497802734375, -0.032073974609375, 0.00026702880859375, 0.0326080322265625, 0.06494903564453125, 0.0972900390625, 0.12963104248046875, 0.1619720458984375, 0.19431304931640625, 0.226654052734375, 0.25899505615234375, 0.2913360595703125, 0.32367706298828125, 0.35601806640625, 0.38835906982421875, 0.4207000732421875, 0.45304107666015625, 0.485382080078125, 0.5177230834960938, 0.5500640869140625, 0.5824050903320312, 0.61474609375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 11.0, 18.0, 36.0, 75.0, 119.0, 160.0, 173.0, 144.0, 102.0, 86.0, 46.0, 17.0, 11.0, 9.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4579567909240723, -2.2746176719665527, -2.091278553009033, -1.9079391956329346, -1.724600076675415, -1.5412609577178955, -1.3579217195510864, -1.1745824813842773, -0.9912433624267578, -0.8079041838645935, -0.6245650053024292, -0.4412258267402649, -0.2578866481781006, -0.07454746961593628, 0.10879170894622803, 0.2921309471130371, 0.47547006607055664, 0.658809244632721, 0.8421484231948853, 1.0254876613616943, 1.2088267803192139, 1.3921658992767334, 1.5755051374435425, 1.7588443756103516, 1.942183494567871, 2.1255226135253906, 2.30886173248291, 2.492201089859009, 2.6755402088165283, 2.858879327774048, 3.0422186851501465, 3.225557804107666, 3.4088964462280273, 3.592235565185547, 3.7755746841430664, 3.958914041519165, 4.1422529220581055, 4.325592517852783, 4.508931636810303, 4.692270755767822, 4.875609874725342, 5.058948993682861, 5.242288112640381, 5.4256272315979, 5.608966827392578, 5.792305946350098, 5.975645065307617, 6.158984184265137, 6.342323303222656, 6.525662422180176, 6.709001541137695, 6.892340660095215, 7.075679779052734, 7.259019374847412, 7.442358493804932, 7.625697612762451, 7.809036731719971, 7.99237585067749, 8.175715446472168, 8.359054565429688, 8.542393684387207, 8.725732803344727, 8.909071922302246, 9.092411041259766, 9.275750160217285]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 2.0, 4.0, 9.0, 8.0, 8.0, 8.0, 4.0, 15.0, 16.0, 14.0, 19.0, 24.0, 30.0, 23.0, 31.0, 27.0, 40.0, 30.0, 47.0, 50.0, 41.0, 42.0, 40.0, 41.0, 45.0, 33.0, 43.0, 32.0, 31.0, 23.0, 22.0, 30.0, 29.0, 24.0, 17.0, 15.0, 11.0, 17.0, 14.0, 9.0, 4.0, 6.0, 5.0, 2.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7019164562225342, -1.6513633728027344, -1.6008104085922241, -1.5502574443817139, -1.499704360961914, -1.4491512775421143, -1.398598313331604, -1.3480453491210938, -1.297492265701294, -1.2469391822814941, -1.1963862180709839, -1.1458332538604736, -1.0952801704406738, -1.044727087020874, -0.9941741228103638, -0.9436210989952087, -0.8930680751800537, -0.8425150513648987, -0.7919620275497437, -0.7414090037345886, -0.6908559799194336, -0.6403029561042786, -0.5897499322891235, -0.5391969084739685, -0.4886438846588135, -0.43809086084365845, -0.3875378370285034, -0.3369848132133484, -0.28643178939819336, -0.23587876558303833, -0.1853257417678833, -0.13477271795272827, -0.08421969413757324, -0.03366667032241821, 0.016886353492736816, 0.06743937730789185, 0.11799240112304688, 0.1685454249382019, 0.21909844875335693, 0.26965147256851196, 0.320204496383667, 0.370757520198822, 0.42131054401397705, 0.4718635678291321, 0.5224165916442871, 0.5729696154594421, 0.6235226392745972, 0.6740756630897522, 0.7246286869049072, 0.7751817107200623, 0.8257347345352173, 0.8762877583503723, 0.9268407821655273, 0.9773938059806824, 1.0279468297958374, 1.0784997940063477, 1.1290528774261475, 1.1796059608459473, 1.2301589250564575, 1.2807118892669678, 1.3312649726867676, 1.3818180561065674, 1.4323710203170776, 1.482923984527588, 1.5334770679473877]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 3.0, 5.0, 9.0, 12.0, 13.0, 20.0, 33.0, 35.0, 52.0, 70.0, 109.0, 155.0, 246.0, 388.0, 545.0, 773.0, 1287.0, 2127.0, 3409.0, 5995.0, 10407.0, 19240.0, 37477.0, 72573.0, 140358.0, 225742.0, 227258.0, 142005.0, 74366.0, 38056.0, 19786.0, 10611.0, 5937.0, 3472.0, 2052.0, 1364.0, 847.0, 522.0, 371.0, 216.0, 186.0, 125.0, 79.0, 46.0, 46.0, 28.0, 19.0, 23.0, 12.0, 11.0, 8.0, 6.0, 6.0, 4.0, 3.0, 6.0], "bins": [-1.25390625, -1.217041015625, -1.18017578125, -1.143310546875, -1.1064453125, -1.069580078125, -1.03271484375, -0.995849609375, -0.958984375, -0.922119140625, -0.88525390625, -0.848388671875, -0.8115234375, -0.774658203125, -0.73779296875, -0.700927734375, -0.6640625, -0.627197265625, -0.59033203125, -0.553466796875, -0.5166015625, -0.479736328125, -0.44287109375, -0.406005859375, -0.369140625, -0.332275390625, -0.29541015625, -0.258544921875, -0.2216796875, -0.184814453125, -0.14794921875, -0.111083984375, -0.07421875, -0.037353515625, -0.00048828125, 0.036376953125, 0.0732421875, 0.110107421875, 0.14697265625, 0.183837890625, 0.220703125, 0.257568359375, 0.29443359375, 0.331298828125, 0.3681640625, 0.405029296875, 0.44189453125, 0.478759765625, 0.515625, 0.552490234375, 0.58935546875, 0.626220703125, 0.6630859375, 0.699951171875, 0.73681640625, 0.773681640625, 0.810546875, 0.847412109375, 0.88427734375, 0.921142578125, 0.9580078125, 0.994873046875, 1.03173828125, 1.068603515625, 1.10546875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 7.0, 13.0, 11.0, 10.0, 16.0, 22.0, 28.0, 26.0, 39.0, 37.0, 41.0, 48.0, 44.0, 48.0, 58.0, 54.0, 41.0, 74.0, 58.0, 50.0, 50.0, 45.0, 30.0, 25.0, 23.0, 15.0, 19.0, 21.0, 15.0, 12.0, 2.0, 9.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53173828125, -0.5132217407226562, -0.4947052001953125, -0.47618865966796875, -0.457672119140625, -0.43915557861328125, -0.4206390380859375, -0.40212249755859375, -0.38360595703125, -0.36508941650390625, -0.3465728759765625, -0.32805633544921875, -0.309539794921875, -0.29102325439453125, -0.2725067138671875, -0.25399017333984375, -0.2354736328125, -0.21695709228515625, -0.1984405517578125, -0.17992401123046875, -0.161407470703125, -0.14289093017578125, -0.1243743896484375, -0.10585784912109375, -0.08734130859375, -0.06882476806640625, -0.0503082275390625, -0.03179168701171875, -0.013275146484375, 0.00524139404296875, 0.0237579345703125, 0.04227447509765625, 0.060791015625, 0.07930755615234375, 0.0978240966796875, 0.11634063720703125, 0.134857177734375, 0.15337371826171875, 0.1718902587890625, 0.19040679931640625, 0.20892333984375, 0.22743988037109375, 0.2459564208984375, 0.26447296142578125, 0.282989501953125, 0.30150604248046875, 0.3200225830078125, 0.33853912353515625, 0.3570556640625, 0.37557220458984375, 0.3940887451171875, 0.41260528564453125, 0.431121826171875, 0.44963836669921875, 0.4681549072265625, 0.48667144775390625, 0.50518798828125, 0.5237045288085938, 0.5422210693359375, 0.5607376098632812, 0.579254150390625, 0.5977706909179688, 0.6162872314453125, 0.6348037719726562, 0.6533203125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 8.0, 11.0, 11.0, 18.0, 29.0, 51.0, 46.0, 68.0, 123.0, 217.0, 379.0, 555.0, 1069.0, 2095.0, 4581.0, 11014.0, 31120.0, 101162.0, 336529.0, 381424.0, 119515.0, 35624.0, 12594.0, 5177.0, 2337.0, 1136.0, 619.0, 363.0, 225.0, 148.0, 93.0, 64.0, 39.0, 33.0, 22.0, 11.0, 12.0, 9.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.24609375, -2.17816162109375, -2.1102294921875, -2.04229736328125, -1.974365234375, -1.90643310546875, -1.8385009765625, -1.77056884765625, -1.70263671875, -1.63470458984375, -1.5667724609375, -1.49884033203125, -1.430908203125, -1.36297607421875, -1.2950439453125, -1.22711181640625, -1.1591796875, -1.09124755859375, -1.0233154296875, -0.95538330078125, -0.887451171875, -0.81951904296875, -0.7515869140625, -0.68365478515625, -0.61572265625, -0.54779052734375, -0.4798583984375, -0.41192626953125, -0.343994140625, -0.27606201171875, -0.2081298828125, -0.14019775390625, -0.072265625, -0.00433349609375, 0.0635986328125, 0.13153076171875, 0.199462890625, 0.26739501953125, 0.3353271484375, 0.40325927734375, 0.47119140625, 0.53912353515625, 0.6070556640625, 0.67498779296875, 0.742919921875, 0.81085205078125, 0.8787841796875, 0.94671630859375, 1.0146484375, 1.08258056640625, 1.1505126953125, 1.21844482421875, 1.286376953125, 1.35430908203125, 1.4222412109375, 1.49017333984375, 1.55810546875, 1.62603759765625, 1.6939697265625, 1.76190185546875, 1.829833984375, 1.89776611328125, 1.9656982421875, 2.03363037109375, 2.1015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 4.0, 3.0, 8.0, 14.0, 15.0, 15.0, 23.0, 18.0, 32.0, 26.0, 28.0, 33.0, 35.0, 42.0, 43.0, 51.0, 52.0, 49.0, 43.0, 49.0, 40.0, 37.0, 42.0, 26.0, 39.0, 27.0, 36.0, 29.0, 23.0, 19.0, 11.0, 15.0, 12.0, 12.0, 6.0, 7.0, 6.0, 8.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.880859375, -2.79632568359375, -2.7117919921875, -2.62725830078125, -2.542724609375, -2.45819091796875, -2.3736572265625, -2.28912353515625, -2.20458984375, -2.12005615234375, -2.0355224609375, -1.95098876953125, -1.866455078125, -1.78192138671875, -1.6973876953125, -1.61285400390625, -1.5283203125, -1.44378662109375, -1.3592529296875, -1.27471923828125, -1.190185546875, -1.10565185546875, -1.0211181640625, -0.93658447265625, -0.85205078125, -0.76751708984375, -0.6829833984375, -0.59844970703125, -0.513916015625, -0.42938232421875, -0.3448486328125, -0.26031494140625, -0.17578125, -0.09124755859375, -0.0067138671875, 0.07781982421875, 0.162353515625, 0.24688720703125, 0.3314208984375, 0.41595458984375, 0.50048828125, 0.58502197265625, 0.6695556640625, 0.75408935546875, 0.838623046875, 0.92315673828125, 1.0076904296875, 1.09222412109375, 1.1767578125, 1.26129150390625, 1.3458251953125, 1.43035888671875, 1.514892578125, 1.59942626953125, 1.6839599609375, 1.76849365234375, 1.85302734375, 1.93756103515625, 2.0220947265625, 2.10662841796875, 2.191162109375, 2.27569580078125, 2.3602294921875, 2.44476318359375, 2.529296875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 8.0, 12.0, 20.0, 19.0, 23.0, 23.0, 61.0, 67.0, 112.0, 170.0, 265.0, 516.0, 1095.0, 2675.0, 8223.0, 36230.0, 292888.0, 604215.0, 80141.0, 14512.0, 4032.0, 1562.0, 699.0, 384.0, 194.0, 128.0, 76.0, 60.0, 42.0, 26.0, 21.0, 12.0, 10.0, 11.0, 4.0, 2.0, 7.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7451171875, -1.687347412109375, -1.62957763671875, -1.571807861328125, -1.5140380859375, -1.456268310546875, -1.39849853515625, -1.340728759765625, -1.282958984375, -1.225189208984375, -1.16741943359375, -1.109649658203125, -1.0518798828125, -0.994110107421875, -0.93634033203125, -0.878570556640625, -0.82080078125, -0.763031005859375, -0.70526123046875, -0.647491455078125, -0.5897216796875, -0.531951904296875, -0.47418212890625, -0.416412353515625, -0.358642578125, -0.300872802734375, -0.24310302734375, -0.185333251953125, -0.1275634765625, -0.069793701171875, -0.01202392578125, 0.045745849609375, 0.103515625, 0.161285400390625, 0.21905517578125, 0.276824951171875, 0.3345947265625, 0.392364501953125, 0.45013427734375, 0.507904052734375, 0.565673828125, 0.623443603515625, 0.68121337890625, 0.738983154296875, 0.7967529296875, 0.854522705078125, 0.91229248046875, 0.970062255859375, 1.02783203125, 1.085601806640625, 1.14337158203125, 1.201141357421875, 1.2589111328125, 1.316680908203125, 1.37445068359375, 1.432220458984375, 1.489990234375, 1.547760009765625, 1.60552978515625, 1.663299560546875, 1.7210693359375, 1.778839111328125, 1.83660888671875, 1.894378662109375, 1.9521484375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 2.0, 9.0, 11.0, 20.0, 16.0, 16.0, 24.0, 46.0, 37.0, 57.0, 75.0, 65.0, 78.0, 86.0, 87.0, 72.0, 56.0, 48.0, 39.0, 37.0, 26.0, 20.0, 16.0, 10.0, 8.0, 7.0, 8.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0002117156982421875, -0.0002048984169960022, -0.0001980811357498169, -0.0001912638545036316, -0.0001844465732574463, -0.00017762929201126099, -0.00017081201076507568, -0.00016399472951889038, -0.00015717744827270508, -0.00015036016702651978, -0.00014354288578033447, -0.00013672560453414917, -0.00012990832328796387, -0.00012309104204177856, -0.00011627376079559326, -0.00010945647954940796, -0.00010263919830322266, -9.582191705703735e-05, -8.900463581085205e-05, -8.218735456466675e-05, -7.537007331848145e-05, -6.855279207229614e-05, -6.173551082611084e-05, -5.491822957992554e-05, -4.8100948333740234e-05, -4.128366708755493e-05, -3.446638584136963e-05, -2.7649104595184326e-05, -2.0831823348999023e-05, -1.401454210281372e-05, -7.197260856628418e-06, -3.7997961044311523e-07, 6.4373016357421875e-06, 1.325458288192749e-05, 2.0071864128112793e-05, 2.6889145374298096e-05, 3.37064266204834e-05, 4.05237078666687e-05, 4.7340989112854004e-05, 5.415827035903931e-05, 6.097555160522461e-05, 6.779283285140991e-05, 7.461011409759521e-05, 8.142739534378052e-05, 8.824467658996582e-05, 9.506195783615112e-05, 0.00010187923908233643, 0.00010869652032852173, 0.00011551380157470703, 0.00012233108282089233, 0.00012914836406707764, 0.00013596564531326294, 0.00014278292655944824, 0.00014960020780563354, 0.00015641748905181885, 0.00016323477029800415, 0.00017005205154418945, 0.00017686933279037476, 0.00018368661403656006, 0.00019050389528274536, 0.00019732117652893066, 0.00020413845777511597, 0.00021095573902130127, 0.00021777302026748657, 0.00022459030151367188]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 7.0, 18.0, 23.0, 26.0, 55.0, 80.0, 139.0, 256.0, 506.0, 1209.0, 3467.0, 14010.0, 112696.0, 735120.0, 156933.0, 17624.0, 3870.0, 1303.0, 540.0, 255.0, 136.0, 69.0, 66.0, 55.0, 26.0, 18.0, 11.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-2.771484375, -2.704803466796875, -2.63812255859375, -2.571441650390625, -2.5047607421875, -2.438079833984375, -2.37139892578125, -2.304718017578125, -2.238037109375, -2.171356201171875, -2.10467529296875, -2.037994384765625, -1.9713134765625, -1.904632568359375, -1.83795166015625, -1.771270751953125, -1.70458984375, -1.637908935546875, -1.57122802734375, -1.504547119140625, -1.4378662109375, -1.371185302734375, -1.30450439453125, -1.237823486328125, -1.171142578125, -1.104461669921875, -1.03778076171875, -0.971099853515625, -0.9044189453125, -0.837738037109375, -0.77105712890625, -0.704376220703125, -0.6376953125, -0.571014404296875, -0.50433349609375, -0.437652587890625, -0.3709716796875, -0.304290771484375, -0.23760986328125, -0.170928955078125, -0.104248046875, -0.037567138671875, 0.02911376953125, 0.095794677734375, 0.1624755859375, 0.229156494140625, 0.29583740234375, 0.362518310546875, 0.42919921875, 0.495880126953125, 0.56256103515625, 0.629241943359375, 0.6959228515625, 0.762603759765625, 0.82928466796875, 0.895965576171875, 0.962646484375, 1.029327392578125, 1.09600830078125, 1.162689208984375, 1.2293701171875, 1.296051025390625, 1.36273193359375, 1.429412841796875, 1.49609375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 1.0, 5.0, 8.0, 7.0, 10.0, 20.0, 16.0, 30.0, 29.0, 39.0, 52.0, 65.0, 53.0, 74.0, 63.0, 83.0, 75.0, 65.0, 51.0, 45.0, 58.0, 35.0, 27.0, 22.0, 22.0, 4.0, 11.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.4775390625, -1.437042236328125, -1.39654541015625, -1.356048583984375, -1.3155517578125, -1.275054931640625, -1.23455810546875, -1.194061279296875, -1.153564453125, -1.113067626953125, -1.07257080078125, -1.032073974609375, -0.9915771484375, -0.951080322265625, -0.91058349609375, -0.870086669921875, -0.82958984375, -0.789093017578125, -0.74859619140625, -0.708099365234375, -0.6676025390625, -0.627105712890625, -0.58660888671875, -0.546112060546875, -0.505615234375, -0.465118408203125, -0.42462158203125, -0.384124755859375, -0.3436279296875, -0.303131103515625, -0.26263427734375, -0.222137451171875, -0.181640625, -0.141143798828125, -0.10064697265625, -0.060150146484375, -0.0196533203125, 0.020843505859375, 0.06134033203125, 0.101837158203125, 0.142333984375, 0.182830810546875, 0.22332763671875, 0.263824462890625, 0.3043212890625, 0.344818115234375, 0.38531494140625, 0.425811767578125, 0.46630859375, 0.506805419921875, 0.54730224609375, 0.587799072265625, 0.6282958984375, 0.668792724609375, 0.70928955078125, 0.749786376953125, 0.790283203125, 0.830780029296875, 0.87127685546875, 0.911773681640625, 0.9522705078125, 0.992767333984375, 1.03326416015625, 1.073760986328125, 1.1142578125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 19.0, 35.0, 35.0, 49.0, 85.0, 96.0, 113.0, 121.0, 129.0, 103.0, 65.0, 51.0, 36.0, 21.0, 12.0, 11.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.681549072265625, -22.873117446899414, -22.064685821533203, -21.256254196166992, -20.44782257080078, -19.63939094543457, -18.83095932006836, -18.02252769470215, -17.214096069335938, -16.405664443969727, -15.597232818603516, -14.788801193237305, -13.980369567871094, -13.171937942504883, -12.363506317138672, -11.555074691772461, -10.74664306640625, -9.938211441040039, -9.129779815673828, -8.321348190307617, -7.512916564941406, -6.704484939575195, -5.896053314208984, -5.087621688842773, -4.2791900634765625, -3.4707584381103516, -2.6623268127441406, -1.8538951873779297, -1.0454635620117188, -0.2370319366455078, 0.5713996887207031, 1.379831314086914, 2.188264846801758, 2.9966964721679688, 3.8051280975341797, 4.613559722900391, 5.421991348266602, 6.2304229736328125, 7.038854598999023, 7.847286224365234, 8.655717849731445, 9.464149475097656, 10.272581100463867, 11.081012725830078, 11.889444351196289, 12.6978759765625, 13.506307601928711, 14.314739227294922, 15.123170852661133, 15.931602478027344, 16.740034103393555, 17.548465728759766, 18.356897354125977, 19.165328979492188, 19.9737606048584, 20.78219223022461, 21.59062385559082, 22.39905548095703, 23.207487106323242, 24.015918731689453, 24.824350357055664, 25.632781982421875, 26.441213607788086, 27.249645233154297, 28.058076858520508]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 3.0, 6.0, 5.0, 13.0, 12.0, 13.0, 23.0, 22.0, 28.0, 33.0, 29.0, 50.0, 35.0, 64.0, 49.0, 62.0, 46.0, 61.0, 57.0, 42.0, 47.0, 44.0, 38.0, 32.0, 40.0, 27.0, 27.0, 21.0, 15.0, 11.0, 13.0, 6.0, 6.0, 4.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.115697860717773, -11.647721290588379, -11.179744720458984, -10.71176815032959, -10.243791580200195, -9.7758150100708, -9.307838439941406, -8.839862823486328, -8.371885299682617, -7.903908729553223, -7.435932159423828, -6.967955589294434, -6.499979019165039, -6.0320024490356445, -5.564026355743408, -5.096049785614014, -4.628073692321777, -4.160097122192383, -3.6921205520629883, -3.224144220352173, -2.7561676502227783, -2.288191080093384, -1.8202147483825684, -1.3522381782531738, -0.8842616081237793, -0.41628509759902954, 0.051691412925720215, 0.5196678638458252, 0.9876444339752197, 1.4556210041046143, 1.9235973358154297, 2.391573905944824, 2.8595504760742188, 3.3275270462036133, 3.795503616333008, 4.263480186462402, 4.731456756591797, 5.199433326721191, 5.667409420013428, 6.135385990142822, 6.603362560272217, 7.071339130401611, 7.539315700531006, 8.007291793823242, 8.475268363952637, 8.943244934082031, 9.411221504211426, 9.87919807434082, 10.347174644470215, 10.81515121459961, 11.283127784729004, 11.751104354858398, 12.219080924987793, 12.687057495117188, 13.155033111572266, 13.623010635375977, 14.090986251831055, 14.55896282196045, 15.026939392089844, 15.494915962219238, 15.962892532348633, 16.43086814880371, 16.898845672607422, 17.3668212890625, 17.83479881286621]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 10.0, 6.0, 13.0, 28.0, 33.0, 48.0, 98.0, 215.0, 436.0, 965.0, 2446.0, 8300.0, 79308.0, 4080153.0, 15990.0, 3682.0, 1286.0, 603.0, 299.0, 138.0, 89.0, 51.0, 27.0, 22.0, 15.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4375, -5.26318359375, -5.0888671875, -4.91455078125, -4.740234375, -4.56591796875, -4.3916015625, -4.21728515625, -4.04296875, -3.86865234375, -3.6943359375, -3.52001953125, -3.345703125, -3.17138671875, -2.9970703125, -2.82275390625, -2.6484375, -2.47412109375, -2.2998046875, -2.12548828125, -1.951171875, -1.77685546875, -1.6025390625, -1.42822265625, -1.25390625, -1.07958984375, -0.9052734375, -0.73095703125, -0.556640625, -0.38232421875, -0.2080078125, -0.03369140625, 0.140625, 0.31494140625, 0.4892578125, 0.66357421875, 0.837890625, 1.01220703125, 1.1865234375, 1.36083984375, 1.53515625, 1.70947265625, 1.8837890625, 2.05810546875, 2.232421875, 2.40673828125, 2.5810546875, 2.75537109375, 2.9296875, 3.10400390625, 3.2783203125, 3.45263671875, 3.626953125, 3.80126953125, 3.9755859375, 4.14990234375, 4.32421875, 4.49853515625, 4.6728515625, 4.84716796875, 5.021484375, 5.19580078125, 5.3701171875, 5.54443359375, 5.71875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 6.0, 13.0, 6.0, 19.0, 21.0, 23.0, 33.0, 45.0, 49.0, 58.0, 58.0, 61.0, 64.0, 66.0, 58.0, 67.0, 57.0, 48.0, 36.0, 38.0, 32.0, 27.0, 19.0, 23.0, 10.0, 11.0, 9.0, 10.0, 3.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.80517578125, -0.7825088500976562, -0.7598419189453125, -0.7371749877929688, -0.714508056640625, -0.6918411254882812, -0.6691741943359375, -0.6465072631835938, -0.62384033203125, -0.6011734008789062, -0.5785064697265625, -0.5558395385742188, -0.533172607421875, -0.5105056762695312, -0.4878387451171875, -0.46517181396484375, -0.4425048828125, -0.41983795166015625, -0.3971710205078125, -0.37450408935546875, -0.351837158203125, -0.32917022705078125, -0.3065032958984375, -0.28383636474609375, -0.26116943359375, -0.23850250244140625, -0.2158355712890625, -0.19316864013671875, -0.170501708984375, -0.14783477783203125, -0.1251678466796875, -0.10250091552734375, -0.079833984375, -0.05716705322265625, -0.0345001220703125, -0.01183319091796875, 0.010833740234375, 0.03350067138671875, 0.0561676025390625, 0.07883453369140625, 0.10150146484375, 0.12416839599609375, 0.1468353271484375, 0.16950225830078125, 0.192169189453125, 0.21483612060546875, 0.2375030517578125, 0.26016998291015625, 0.2828369140625, 0.30550384521484375, 0.3281707763671875, 0.35083770751953125, 0.373504638671875, 0.39617156982421875, 0.4188385009765625, 0.44150543212890625, 0.46417236328125, 0.48683929443359375, 0.5095062255859375, 0.5321731567382812, 0.554840087890625, 0.5775070190429688, 0.6001739501953125, 0.6228408813476562, 0.6455078125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 3.0, 11.0, 18.0, 14.0, 22.0, 23.0, 29.0, 48.0, 80.0, 118.0, 221.0, 359.0, 667.0, 1491.0, 3507.0, 10899.0, 74194.0, 4056017.0, 34471.0, 7016.0, 2555.0, 1167.0, 521.0, 277.0, 189.0, 94.0, 74.0, 53.0, 30.0, 23.0, 12.0, 16.0, 17.0, 8.0, 7.0, 3.0, 5.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.32366943359375, -6.1395263671875, -5.95538330078125, -5.771240234375, -5.58709716796875, -5.4029541015625, -5.21881103515625, -5.03466796875, -4.85052490234375, -4.6663818359375, -4.48223876953125, -4.298095703125, -4.11395263671875, -3.9298095703125, -3.74566650390625, -3.5615234375, -3.37738037109375, -3.1932373046875, -3.00909423828125, -2.824951171875, -2.64080810546875, -2.4566650390625, -2.27252197265625, -2.08837890625, -1.90423583984375, -1.7200927734375, -1.53594970703125, -1.351806640625, -1.16766357421875, -0.9835205078125, -0.79937744140625, -0.615234375, -0.43109130859375, -0.2469482421875, -0.06280517578125, 0.121337890625, 0.30548095703125, 0.4896240234375, 0.67376708984375, 0.85791015625, 1.04205322265625, 1.2261962890625, 1.41033935546875, 1.594482421875, 1.77862548828125, 1.9627685546875, 2.14691162109375, 2.3310546875, 2.51519775390625, 2.6993408203125, 2.88348388671875, 3.067626953125, 3.25177001953125, 3.4359130859375, 3.62005615234375, 3.80419921875, 3.98834228515625, 4.1724853515625, 4.35662841796875, 4.540771484375, 4.72491455078125, 4.9090576171875, 5.09320068359375, 5.27734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 8.0, 8.0, 10.0, 25.0, 50.0, 117.0, 3643.0, 116.0, 40.0, 23.0, 15.0, 9.0, 6.0, 0.0, 0.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2421875, -1.1952972412109375, -1.148406982421875, -1.1015167236328125, -1.05462646484375, -1.0077362060546875, -0.960845947265625, -0.9139556884765625, -0.8670654296875, -0.8201751708984375, -0.773284912109375, -0.7263946533203125, -0.67950439453125, -0.6326141357421875, -0.585723876953125, -0.5388336181640625, -0.491943359375, -0.4450531005859375, -0.398162841796875, -0.3512725830078125, -0.30438232421875, -0.2574920654296875, -0.210601806640625, -0.1637115478515625, -0.1168212890625, -0.0699310302734375, -0.023040771484375, 0.0238494873046875, 0.07073974609375, 0.1176300048828125, 0.164520263671875, 0.2114105224609375, 0.25830078125, 0.3051910400390625, 0.352081298828125, 0.3989715576171875, 0.44586181640625, 0.4927520751953125, 0.539642333984375, 0.5865325927734375, 0.6334228515625, 0.6803131103515625, 0.727203369140625, 0.7740936279296875, 0.82098388671875, 0.8678741455078125, 0.914764404296875, 0.9616546630859375, 1.008544921875, 1.0554351806640625, 1.102325439453125, 1.1492156982421875, 1.19610595703125, 1.2429962158203125, 1.289886474609375, 1.3367767333984375, 1.3836669921875, 1.4305572509765625, 1.477447509765625, 1.5243377685546875, 1.57122802734375, 1.6181182861328125, 1.665008544921875, 1.7118988037109375, 1.7587890625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 8.0, 5.0, 16.0, 34.0, 46.0, 61.0, 76.0, 89.0, 105.0, 94.0, 108.0, 90.0, 86.0, 52.0, 44.0, 27.0, 13.0, 11.0, 13.0, 8.0, 5.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.702145576477051, -2.5952060222625732, -2.4882664680480957, -2.381326913833618, -2.2743873596191406, -2.167447805404663, -2.0605082511901855, -1.9535688161849976, -1.84662926197052, -1.7396897077560425, -1.632750153541565, -1.525810718536377, -1.4188711643218994, -1.3119316101074219, -1.2049920558929443, -1.0980525016784668, -0.9911129474639893, -0.8841733932495117, -0.7772338390350342, -0.6702943444252014, -0.5633547902107239, -0.45641523599624634, -0.3494757413864136, -0.24253618717193604, -0.1355966329574585, -0.02865709364414215, 0.0782824456691742, 0.18522197008132935, 0.2921615242958069, 0.3991010785102844, 0.5060405731201172, 0.6129801273345947, 0.7199196815490723, 0.8268592357635498, 0.9337987899780273, 1.0407383441925049, 1.1476778984069824, 1.25461745262146, 1.361556887626648, 1.4684964418411255, 1.575435996055603, 1.6823755502700806, 1.789315104484558, 1.896254539489746, 2.0031940937042236, 2.110133647918701, 2.2170732021331787, 2.3240127563476562, 2.430952310562134, 2.5378918647766113, 2.644831418991089, 2.7517709732055664, 2.858710527420044, 2.9656500816345215, 3.07258939743042, 3.1795291900634766, 3.286468505859375, 3.3934080600738525, 3.50034761428833, 3.6072871685028076, 3.714226722717285, 3.8211662769317627, 3.9281058311462402, 4.035045146942139, 4.141984939575195]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 8.0, 3.0, 11.0, 9.0, 2.0, 18.0, 19.0, 24.0, 18.0, 15.0, 25.0, 41.0, 32.0, 43.0, 39.0, 44.0, 44.0, 54.0, 50.0, 53.0, 43.0, 38.0, 49.0, 33.0, 38.0, 34.0, 28.0, 23.0, 25.0, 27.0, 23.0, 9.0, 17.0, 10.0, 12.0, 9.0, 6.0, 7.0, 3.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8859353065490723, -1.8234976530075073, -1.7610599994659424, -1.6986223459243774, -1.6361846923828125, -1.5737470388412476, -1.5113093852996826, -1.4488716125488281, -1.3864340782165527, -1.3239964246749878, -1.2615587711334229, -1.199121117591858, -1.136683464050293, -1.074245810508728, -1.011808156967163, -0.9493704438209534, -0.8869327306747437, -0.8244950771331787, -0.7620574235916138, -0.6996197700500488, -0.6371821165084839, -0.574744462966919, -0.5123067498207092, -0.4498690962791443, -0.38743144273757935, -0.3249937891960144, -0.26255613565444946, -0.20011845231056213, -0.1376807987689972, -0.07524314522743225, -0.012805461883544922, 0.04963219165802002, 0.11206984519958496, 0.1745074987411499, 0.23694516718387604, 0.2993828356266022, 0.3618204891681671, 0.42425814270973206, 0.4866958260536194, 0.5491334795951843, 0.6115711331367493, 0.6740087866783142, 0.7364464402198792, 0.7988841533660889, 0.8613218069076538, 0.9237594604492188, 0.9861971139907837, 1.0486347675323486, 1.1110724210739136, 1.1735100746154785, 1.2359477281570435, 1.2983853816986084, 1.3608230352401733, 1.4232606887817383, 1.4856984615325928, 1.5481359958648682, 1.6105737686157227, 1.6730114221572876, 1.7354490756988525, 1.7978867292404175, 1.8603243827819824, 1.9227620363235474, 1.9851996898651123, 2.047637462615967, 2.110074996948242]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 9.0, 13.0, 20.0, 26.0, 54.0, 73.0, 111.0, 186.0, 353.0, 696.0, 1361.0, 2774.0, 6229.0, 16640.0, 51943.0, 186105.0, 454966.0, 230451.0, 63044.0, 19902.0, 7367.0, 3111.0, 1440.0, 715.0, 398.0, 214.0, 125.0, 74.0, 56.0, 31.0, 28.0, 12.0, 12.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.087890625, -3.00347900390625, -2.9190673828125, -2.83465576171875, -2.750244140625, -2.66583251953125, -2.5814208984375, -2.49700927734375, -2.41259765625, -2.32818603515625, -2.2437744140625, -2.15936279296875, -2.074951171875, -1.99053955078125, -1.9061279296875, -1.82171630859375, -1.7373046875, -1.65289306640625, -1.5684814453125, -1.48406982421875, -1.399658203125, -1.31524658203125, -1.2308349609375, -1.14642333984375, -1.06201171875, -0.97760009765625, -0.8931884765625, -0.80877685546875, -0.724365234375, -0.63995361328125, -0.5555419921875, -0.47113037109375, -0.38671875, -0.30230712890625, -0.2178955078125, -0.13348388671875, -0.049072265625, 0.03533935546875, 0.1197509765625, 0.20416259765625, 0.28857421875, 0.37298583984375, 0.4573974609375, 0.54180908203125, 0.626220703125, 0.71063232421875, 0.7950439453125, 0.87945556640625, 0.9638671875, 1.04827880859375, 1.1326904296875, 1.21710205078125, 1.301513671875, 1.38592529296875, 1.4703369140625, 1.55474853515625, 1.63916015625, 1.72357177734375, 1.8079833984375, 1.89239501953125, 1.976806640625, 2.06121826171875, 2.1456298828125, 2.23004150390625, 2.314453125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 1.0, 7.0, 6.0, 6.0, 10.0, 17.0, 6.0, 21.0, 13.0, 23.0, 34.0, 33.0, 56.0, 46.0, 53.0, 67.0, 60.0, 51.0, 65.0, 70.0, 50.0, 58.0, 41.0, 30.0, 36.0, 22.0, 27.0, 18.0, 15.0, 10.0, 9.0, 5.0, 9.0, 4.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81494140625, -0.7883682250976562, -0.7617950439453125, -0.7352218627929688, -0.708648681640625, -0.6820755004882812, -0.6555023193359375, -0.6289291381835938, -0.60235595703125, -0.5757827758789062, -0.5492095947265625, -0.5226364135742188, -0.496063232421875, -0.46949005126953125, -0.4429168701171875, -0.41634368896484375, -0.3897705078125, -0.36319732666015625, -0.3366241455078125, -0.31005096435546875, -0.283477783203125, -0.25690460205078125, -0.2303314208984375, -0.20375823974609375, -0.17718505859375, -0.15061187744140625, -0.1240386962890625, -0.09746551513671875, -0.070892333984375, -0.04431915283203125, -0.0177459716796875, 0.00882720947265625, 0.035400390625, 0.06197357177734375, 0.0885467529296875, 0.11511993408203125, 0.141693115234375, 0.16826629638671875, 0.1948394775390625, 0.22141265869140625, 0.24798583984375, 0.27455902099609375, 0.3011322021484375, 0.32770538330078125, 0.354278564453125, 0.38085174560546875, 0.4074249267578125, 0.43399810791015625, 0.4605712890625, 0.48714447021484375, 0.5137176513671875, 0.5402908325195312, 0.566864013671875, 0.5934371948242188, 0.6200103759765625, 0.6465835571289062, 0.67315673828125, 0.6997299194335938, 0.7263031005859375, 0.7528762817382812, 0.779449462890625, 0.8060226440429688, 0.8325958251953125, 0.8591690063476562, 0.8857421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 9.0, 17.0, 23.0, 27.0, 51.0, 68.0, 102.0, 211.0, 453.0, 845.0, 2351.0, 8293.0, 42321.0, 311490.0, 575038.0, 86763.0, 14406.0, 3659.0, 1225.0, 539.0, 274.0, 131.0, 85.0, 39.0, 39.0, 31.0, 19.0, 10.0, 10.0, 9.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.12890625, -4.011566162109375, -3.89422607421875, -3.776885986328125, -3.6595458984375, -3.542205810546875, -3.42486572265625, -3.307525634765625, -3.190185546875, -3.072845458984375, -2.95550537109375, -2.838165283203125, -2.7208251953125, -2.603485107421875, -2.48614501953125, -2.368804931640625, -2.25146484375, -2.134124755859375, -2.01678466796875, -1.899444580078125, -1.7821044921875, -1.664764404296875, -1.54742431640625, -1.430084228515625, -1.312744140625, -1.195404052734375, -1.07806396484375, -0.960723876953125, -0.8433837890625, -0.726043701171875, -0.60870361328125, -0.491363525390625, -0.3740234375, -0.256683349609375, -0.13934326171875, -0.022003173828125, 0.0953369140625, 0.212677001953125, 0.33001708984375, 0.447357177734375, 0.564697265625, 0.682037353515625, 0.79937744140625, 0.916717529296875, 1.0340576171875, 1.151397705078125, 1.26873779296875, 1.386077880859375, 1.50341796875, 1.620758056640625, 1.73809814453125, 1.855438232421875, 1.9727783203125, 2.090118408203125, 2.20745849609375, 2.324798583984375, 2.442138671875, 2.559478759765625, 2.67681884765625, 2.794158935546875, 2.9114990234375, 3.028839111328125, 3.14617919921875, 3.263519287109375, 3.380859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 15.0, 18.0, 12.0, 16.0, 21.0, 15.0, 34.0, 27.0, 31.0, 42.0, 34.0, 42.0, 55.0, 38.0, 44.0, 42.0, 44.0, 49.0, 37.0, 42.0, 54.0, 41.0, 21.0, 30.0, 32.0, 26.0, 24.0, 24.0, 16.0, 15.0, 15.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.603515625, -3.48968505859375, -3.3758544921875, -3.26202392578125, -3.148193359375, -3.03436279296875, -2.9205322265625, -2.80670166015625, -2.69287109375, -2.57904052734375, -2.4652099609375, -2.35137939453125, -2.237548828125, -2.12371826171875, -2.0098876953125, -1.89605712890625, -1.7822265625, -1.66839599609375, -1.5545654296875, -1.44073486328125, -1.326904296875, -1.21307373046875, -1.0992431640625, -0.98541259765625, -0.87158203125, -0.75775146484375, -0.6439208984375, -0.53009033203125, -0.416259765625, -0.30242919921875, -0.1885986328125, -0.07476806640625, 0.0390625, 0.15289306640625, 0.2667236328125, 0.38055419921875, 0.494384765625, 0.60821533203125, 0.7220458984375, 0.83587646484375, 0.94970703125, 1.06353759765625, 1.1773681640625, 1.29119873046875, 1.405029296875, 1.51885986328125, 1.6326904296875, 1.74652099609375, 1.8603515625, 1.97418212890625, 2.0880126953125, 2.20184326171875, 2.315673828125, 2.42950439453125, 2.5433349609375, 2.65716552734375, 2.77099609375, 2.88482666015625, 2.9986572265625, 3.11248779296875, 3.226318359375, 3.34014892578125, 3.4539794921875, 3.56781005859375, 3.681640625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 10.0, 10.0, 21.0, 28.0, 64.0, 102.0, 205.0, 463.0, 1336.0, 6669.0, 127401.0, 881579.0, 26203.0, 2945.0, 802.0, 330.0, 151.0, 87.0, 52.0, 24.0, 19.0, 13.0, 13.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-6.42578125, -6.277313232421875, -6.12884521484375, -5.980377197265625, -5.8319091796875, -5.683441162109375, -5.53497314453125, -5.386505126953125, -5.238037109375, -5.089569091796875, -4.94110107421875, -4.792633056640625, -4.6441650390625, -4.495697021484375, -4.34722900390625, -4.198760986328125, -4.05029296875, -3.901824951171875, -3.75335693359375, -3.604888916015625, -3.4564208984375, -3.307952880859375, -3.15948486328125, -3.011016845703125, -2.862548828125, -2.714080810546875, -2.56561279296875, -2.417144775390625, -2.2686767578125, -2.120208740234375, -1.97174072265625, -1.823272705078125, -1.6748046875, -1.526336669921875, -1.37786865234375, -1.229400634765625, -1.0809326171875, -0.932464599609375, -0.78399658203125, -0.635528564453125, -0.487060546875, -0.338592529296875, -0.19012451171875, -0.041656494140625, 0.1068115234375, 0.255279541015625, 0.40374755859375, 0.552215576171875, 0.70068359375, 0.849151611328125, 0.99761962890625, 1.146087646484375, 1.2945556640625, 1.443023681640625, 1.59149169921875, 1.739959716796875, 1.888427734375, 2.036895751953125, 2.18536376953125, 2.333831787109375, 2.4822998046875, 2.630767822265625, 2.77923583984375, 2.927703857421875, 3.076171875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 7.0, 8.0, 8.0, 17.0, 12.0, 28.0, 35.0, 40.0, 52.0, 74.0, 70.0, 77.0, 91.0, 89.0, 75.0, 83.0, 42.0, 37.0, 39.0, 27.0, 17.0, 18.0, 13.0, 7.0, 3.0, 12.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026607513427734375, -0.0002577193081378937, -0.0002493634819984436, -0.00024100765585899353, -0.00023265182971954346, -0.00022429600358009338, -0.0002159401774406433, -0.00020758435130119324, -0.00019922852516174316, -0.0001908726990222931, -0.00018251687288284302, -0.00017416104674339294, -0.00016580522060394287, -0.0001574493944644928, -0.00014909356832504272, -0.00014073774218559265, -0.00013238191604614258, -0.0001240260899066925, -0.00011567026376724243, -0.00010731443762779236, -9.895861148834229e-05, -9.060278534889221e-05, -8.224695920944214e-05, -7.389113306999207e-05, -6.553530693054199e-05, -5.717948079109192e-05, -4.8823654651641846e-05, -4.046782851219177e-05, -3.21120023727417e-05, -2.3756176233291626e-05, -1.5400350093841553e-05, -7.0445239543914795e-06, 1.3113021850585938e-06, 9.667128324508667e-06, 1.802295446395874e-05, 2.6378780603408813e-05, 3.473460674285889e-05, 4.309043288230896e-05, 5.144625902175903e-05, 5.9802085161209106e-05, 6.815791130065918e-05, 7.651373744010925e-05, 8.486956357955933e-05, 9.32253897190094e-05, 0.00010158121585845947, 0.00010993704199790955, 0.00011829286813735962, 0.0001266486942768097, 0.00013500452041625977, 0.00014336034655570984, 0.0001517161726951599, 0.00016007199883460999, 0.00016842782497406006, 0.00017678365111351013, 0.0001851394772529602, 0.00019349530339241028, 0.00020185112953186035, 0.00021020695567131042, 0.0002185627818107605, 0.00022691860795021057, 0.00023527443408966064, 0.00024363026022911072, 0.0002519860863685608, 0.00026034191250801086, 0.00026869773864746094]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 15.0, 14.0, 22.0, 35.0, 57.0, 90.0, 154.0, 285.0, 535.0, 1312.0, 3756.0, 14158.0, 97156.0, 756302.0, 148900.0, 18400.0, 4364.0, 1574.0, 660.0, 317.0, 175.0, 82.0, 56.0, 38.0, 18.0, 15.0, 17.0, 8.0, 5.0, 2.0, 8.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.447265625, -2.36724853515625, -2.2872314453125, -2.20721435546875, -2.127197265625, -2.04718017578125, -1.9671630859375, -1.88714599609375, -1.80712890625, -1.72711181640625, -1.6470947265625, -1.56707763671875, -1.487060546875, -1.40704345703125, -1.3270263671875, -1.24700927734375, -1.1669921875, -1.08697509765625, -1.0069580078125, -0.92694091796875, -0.846923828125, -0.76690673828125, -0.6868896484375, -0.60687255859375, -0.52685546875, -0.44683837890625, -0.3668212890625, -0.28680419921875, -0.206787109375, -0.12677001953125, -0.0467529296875, 0.03326416015625, 0.11328125, 0.19329833984375, 0.2733154296875, 0.35333251953125, 0.433349609375, 0.51336669921875, 0.5933837890625, 0.67340087890625, 0.75341796875, 0.83343505859375, 0.9134521484375, 0.99346923828125, 1.073486328125, 1.15350341796875, 1.2335205078125, 1.31353759765625, 1.3935546875, 1.47357177734375, 1.5535888671875, 1.63360595703125, 1.713623046875, 1.79364013671875, 1.8736572265625, 1.95367431640625, 2.03369140625, 2.11370849609375, 2.1937255859375, 2.27374267578125, 2.353759765625, 2.43377685546875, 2.5137939453125, 2.59381103515625, 2.673828125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 12.0, 10.0, 14.0, 14.0, 19.0, 43.0, 71.0, 108.0, 113.0, 111.0, 126.0, 111.0, 60.0, 50.0, 31.0, 23.0, 18.0, 19.0, 13.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.701171875, -2.612945556640625, -2.52471923828125, -2.436492919921875, -2.3482666015625, -2.260040283203125, -2.17181396484375, -2.083587646484375, -1.995361328125, -1.907135009765625, -1.81890869140625, -1.730682373046875, -1.6424560546875, -1.554229736328125, -1.46600341796875, -1.377777099609375, -1.28955078125, -1.201324462890625, -1.11309814453125, -1.024871826171875, -0.9366455078125, -0.848419189453125, -0.76019287109375, -0.671966552734375, -0.583740234375, -0.495513916015625, -0.40728759765625, -0.319061279296875, -0.2308349609375, -0.142608642578125, -0.05438232421875, 0.033843994140625, 0.1220703125, 0.210296630859375, 0.29852294921875, 0.386749267578125, 0.4749755859375, 0.563201904296875, 0.65142822265625, 0.739654541015625, 0.827880859375, 0.916107177734375, 1.00433349609375, 1.092559814453125, 1.1807861328125, 1.269012451171875, 1.35723876953125, 1.445465087890625, 1.53369140625, 1.621917724609375, 1.71014404296875, 1.798370361328125, 1.8865966796875, 1.974822998046875, 2.06304931640625, 2.151275634765625, 2.239501953125, 2.327728271484375, 2.41595458984375, 2.504180908203125, 2.5924072265625, 2.680633544921875, 2.76885986328125, 2.857086181640625, 2.9453125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 12.0, 18.0, 29.0, 64.0, 91.0, 126.0, 167.0, 154.0, 118.0, 86.0, 61.0, 28.0, 24.0, 11.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.20188903808594, -38.04933547973633, -36.89678192138672, -35.74422836303711, -34.5916748046875, -33.439125061035156, -32.28656768798828, -31.134017944335938, -29.981464385986328, -28.82891082763672, -27.67635726928711, -26.5238037109375, -25.371252059936523, -24.218698501586914, -23.066144943237305, -21.913593292236328, -20.761037826538086, -19.608484268188477, -18.455930709838867, -17.30337905883789, -16.15082550048828, -14.998271942138672, -13.845718383789062, -12.69316577911377, -11.54061222076416, -10.38805866241455, -9.235506057739258, -8.082952499389648, -6.930399417877197, -5.777846336364746, -4.625292778015137, -3.4727401733398438, -2.3201866149902344, -1.1676334142684937, -0.01508021354675293, 1.1374731063842773, 2.2900261878967285, 3.4425792694091797, 4.595132827758789, 5.747685432434082, 6.900238990783691, 8.0527925491333, 9.205345153808594, 10.357898712158203, 11.510452270507812, 12.663004875183105, 13.815558433532715, 14.968111038208008, 16.120664596557617, 17.273218154907227, 18.425771713256836, 19.578323364257812, 20.730876922607422, 21.88343048095703, 23.03598403930664, 24.18853759765625, 25.34109115600586, 26.49364471435547, 27.646198272705078, 28.798751831054688, 29.951303482055664, 31.103857040405273, 32.25640869140625, 33.40896224975586, 34.56151580810547]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 9.0, 13.0, 11.0, 26.0, 20.0, 31.0, 42.0, 48.0, 60.0, 67.0, 76.0, 71.0, 77.0, 70.0, 66.0, 71.0, 51.0, 47.0, 37.0, 24.0, 18.0, 20.0, 14.0, 11.0, 10.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.44010353088379, -18.615272521972656, -17.790443420410156, -16.965612411499023, -16.14078140258789, -15.315950393676758, -14.491120338439941, -13.666290283203125, -12.841459274291992, -12.01662826538086, -11.191798210144043, -10.366968154907227, -9.542137145996094, -8.717306137084961, -7.8924760818481445, -7.06764554977417, -6.242815017700195, -5.417984485626221, -4.593153953552246, -3.7683234214782715, -2.943492889404297, -2.1186623573303223, -1.2938318252563477, -0.46900129318237305, 0.35582923889160156, 1.1806597709655762, 2.005490303039551, 2.8303208351135254, 3.6551513671875, 4.479981899261475, 5.304812431335449, 6.129642963409424, 6.954475402832031, 7.779305934906006, 8.60413646697998, 9.428966522216797, 10.25379753112793, 11.078628540039062, 11.903458595275879, 12.728288650512695, 13.553119659423828, 14.377950668334961, 15.202780723571777, 16.027610778808594, 16.852441787719727, 17.67727279663086, 18.50210189819336, 19.326932907104492, 20.151763916015625, 20.976594924926758, 21.80142593383789, 22.62625503540039, 23.451086044311523, 24.275917053222656, 25.100746154785156, 25.92557716369629, 26.750408172607422, 27.575239181518555, 28.400070190429688, 29.224899291992188, 30.04973030090332, 30.874561309814453, 31.699390411376953, 32.52422332763672, 33.34905242919922]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 5.0, 7.0, 9.0, 22.0, 22.0, 38.0, 62.0, 66.0, 117.0, 183.0, 293.0, 473.0, 858.0, 1573.0, 3315.0, 7411.0, 24141.0, 193121.0, 3891738.0, 49593.0, 11909.0, 4640.0, 2078.0, 1057.0, 581.0, 350.0, 200.0, 132.0, 101.0, 52.0, 37.0, 35.0, 18.0, 12.0, 7.0, 8.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.111328125, -3.001068115234375, -2.89080810546875, -2.780548095703125, -2.6702880859375, -2.560028076171875, -2.44976806640625, -2.339508056640625, -2.229248046875, -2.118988037109375, -2.00872802734375, -1.898468017578125, -1.7882080078125, -1.677947998046875, -1.56768798828125, -1.457427978515625, -1.34716796875, -1.236907958984375, -1.12664794921875, -1.016387939453125, -0.9061279296875, -0.795867919921875, -0.68560791015625, -0.575347900390625, -0.465087890625, -0.354827880859375, -0.24456787109375, -0.134307861328125, -0.0240478515625, 0.086212158203125, 0.19647216796875, 0.306732177734375, 0.4169921875, 0.527252197265625, 0.63751220703125, 0.747772216796875, 0.8580322265625, 0.968292236328125, 1.07855224609375, 1.188812255859375, 1.299072265625, 1.409332275390625, 1.51959228515625, 1.629852294921875, 1.7401123046875, 1.850372314453125, 1.96063232421875, 2.070892333984375, 2.18115234375, 2.291412353515625, 2.40167236328125, 2.511932373046875, 2.6221923828125, 2.732452392578125, 2.84271240234375, 2.952972412109375, 3.063232421875, 3.173492431640625, 3.28375244140625, 3.394012451171875, 3.5042724609375, 3.614532470703125, 3.72479248046875, 3.835052490234375, 3.9453125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 6.0, 2.0, 9.0, 9.0, 6.0, 14.0, 16.0, 22.0, 28.0, 36.0, 53.0, 69.0, 74.0, 83.0, 92.0, 80.0, 97.0, 89.0, 58.0, 48.0, 33.0, 26.0, 19.0, 14.0, 6.0, 4.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90673828125, -0.8650436401367188, -0.8233489990234375, -0.7816543579101562, -0.739959716796875, -0.6982650756835938, -0.6565704345703125, -0.6148757934570312, -0.57318115234375, -0.5314865112304688, -0.4897918701171875, -0.44809722900390625, -0.406402587890625, -0.36470794677734375, -0.3230133056640625, -0.28131866455078125, -0.2396240234375, -0.19792938232421875, -0.1562347412109375, -0.11454010009765625, -0.072845458984375, -0.03115081787109375, 0.0105438232421875, 0.05223846435546875, 0.09393310546875, 0.13562774658203125, 0.1773223876953125, 0.21901702880859375, 0.260711669921875, 0.30240631103515625, 0.3441009521484375, 0.38579559326171875, 0.427490234375, 0.46918487548828125, 0.5108795166015625, 0.5525741577148438, 0.594268798828125, 0.6359634399414062, 0.6776580810546875, 0.7193527221679688, 0.76104736328125, 0.8027420043945312, 0.8444366455078125, 0.8861312866210938, 0.927825927734375, 0.9695205688476562, 1.0112152099609375, 1.0529098510742188, 1.0946044921875, 1.1362991333007812, 1.1779937744140625, 1.2196884155273438, 1.261383056640625, 1.3030776977539062, 1.3447723388671875, 1.3864669799804688, 1.42816162109375, 1.4698562622070312, 1.5115509033203125, 1.5532455444335938, 1.594940185546875, 1.6366348266601562, 1.6783294677734375, 1.7200241088867188, 1.76171875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 6.0, 6.0, 8.0, 13.0, 13.0, 20.0, 23.0, 27.0, 49.0, 76.0, 113.0, 224.0, 471.0, 1274.0, 3894.0, 15794.0, 174937.0, 3943429.0, 42916.0, 7356.0, 2021.0, 776.0, 344.0, 166.0, 88.0, 59.0, 43.0, 45.0, 14.0, 11.0, 12.0, 6.0, 8.0, 7.0, 6.0, 3.0, 4.0, 3.0, 9.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.703125, -7.484619140625, -7.26611328125, -7.047607421875, -6.8291015625, -6.610595703125, -6.39208984375, -6.173583984375, -5.955078125, -5.736572265625, -5.51806640625, -5.299560546875, -5.0810546875, -4.862548828125, -4.64404296875, -4.425537109375, -4.20703125, -3.988525390625, -3.77001953125, -3.551513671875, -3.3330078125, -3.114501953125, -2.89599609375, -2.677490234375, -2.458984375, -2.240478515625, -2.02197265625, -1.803466796875, -1.5849609375, -1.366455078125, -1.14794921875, -0.929443359375, -0.7109375, -0.492431640625, -0.27392578125, -0.055419921875, 0.1630859375, 0.381591796875, 0.60009765625, 0.818603515625, 1.037109375, 1.255615234375, 1.47412109375, 1.692626953125, 1.9111328125, 2.129638671875, 2.34814453125, 2.566650390625, 2.78515625, 3.003662109375, 3.22216796875, 3.440673828125, 3.6591796875, 3.877685546875, 4.09619140625, 4.314697265625, 4.533203125, 4.751708984375, 4.97021484375, 5.188720703125, 5.4072265625, 5.625732421875, 5.84423828125, 6.062744140625, 6.28125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 5.0, 4.0, 4.0, 11.0, 16.0, 20.0, 23.0, 19.0, 29.0, 58.0, 103.0, 238.0, 2845.0, 364.0, 128.0, 68.0, 55.0, 22.0, 20.0, 12.0, 10.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.1780242919921875, -2.121673583984375, -2.0653228759765625, -2.00897216796875, -1.9526214599609375, -1.896270751953125, -1.8399200439453125, -1.7835693359375, -1.7272186279296875, -1.670867919921875, -1.6145172119140625, -1.55816650390625, -1.5018157958984375, -1.445465087890625, -1.3891143798828125, -1.332763671875, -1.2764129638671875, -1.220062255859375, -1.1637115478515625, -1.10736083984375, -1.0510101318359375, -0.994659423828125, -0.9383087158203125, -0.8819580078125, -0.8256072998046875, -0.769256591796875, -0.7129058837890625, -0.65655517578125, -0.6002044677734375, -0.543853759765625, -0.4875030517578125, -0.43115234375, -0.3748016357421875, -0.318450927734375, -0.2621002197265625, -0.20574951171875, -0.1493988037109375, -0.093048095703125, -0.0366973876953125, 0.0196533203125, 0.0760040283203125, 0.132354736328125, 0.1887054443359375, 0.24505615234375, 0.3014068603515625, 0.357757568359375, 0.4141082763671875, 0.470458984375, 0.5268096923828125, 0.583160400390625, 0.6395111083984375, 0.69586181640625, 0.7522125244140625, 0.808563232421875, 0.8649139404296875, 0.9212646484375, 0.9776153564453125, 1.033966064453125, 1.0903167724609375, 1.14666748046875, 1.2030181884765625, 1.259368896484375, 1.3157196044921875, 1.3720703125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 7.0, 9.0, 22.0, 30.0, 48.0, 71.0, 119.0, 134.0, 175.0, 166.0, 100.0, 61.0, 29.0, 14.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.355575561523438, -18.96014404296875, -18.56471061706543, -18.169279098510742, -17.773845672607422, -17.378414154052734, -16.982982635498047, -16.587549209594727, -16.19211769104004, -15.796685218811035, -15.401252746582031, -15.005821228027344, -14.61038875579834, -14.214956283569336, -13.819524765014648, -13.424092292785645, -13.02865982055664, -12.633227348327637, -12.237794876098633, -11.842363357543945, -11.446930885314941, -11.051498413085938, -10.65606689453125, -10.260634422302246, -9.865201950073242, -9.469769477844238, -9.074337005615234, -8.678905487060547, -8.283473014831543, -7.888040542602539, -7.492608547210693, -7.097176551818848, -6.7017436027526855, -6.30631160736084, -5.910879135131836, -5.515446662902832, -5.120014667510986, -4.724582672119141, -4.329150199890137, -3.933717966079712, -3.538285732269287, -3.1428534984588623, -2.7474212646484375, -2.3519890308380127, -1.956556797027588, -1.561124563217163, -1.1656923294067383, -0.7702600955963135, -0.37482786178588867, 0.020604372024536133, 0.41603660583496094, 0.8114688396453857, 1.2069010734558105, 1.6023333072662354, 1.9977655410766602, 2.393197774887085, 2.7886300086975098, 3.1840622425079346, 3.5794944763183594, 3.974926710128784, 4.370358943939209, 4.765790939331055, 5.161223411560059, 5.5566558837890625, 5.952087879180908]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 3.0, 6.0, 6.0, 9.0, 14.0, 11.0, 16.0, 18.0, 17.0, 22.0, 16.0, 21.0, 27.0, 30.0, 34.0, 38.0, 39.0, 35.0, 38.0, 36.0, 37.0, 39.0, 42.0, 28.0, 33.0, 37.0, 40.0, 29.0, 28.0, 28.0, 31.0, 23.0, 25.0, 23.0, 9.0, 17.0, 10.0, 13.0, 12.0, 7.0, 12.0, 5.0, 7.0, 3.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.132979869842529, -4.982744216918945, -4.832508563995361, -4.682272911071777, -4.532036781311035, -4.381801128387451, -4.231565475463867, -4.081329822540283, -3.931094169616699, -3.7808585166931152, -3.6306228637695312, -3.480386972427368, -3.330151319503784, -3.1799156665802, -3.029679775238037, -2.879444122314453, -2.729208469390869, -2.578972816467285, -2.428737163543701, -2.278501272201538, -2.128265619277954, -1.9780299663543701, -1.8277941942214966, -1.677558422088623, -1.527322769165039, -1.377087116241455, -1.2268513441085815, -1.076615571975708, -0.926379919052124, -0.7761442065238953, -0.6259084939956665, -0.47567272186279297, -0.3254365921020508, -0.17520087957382202, -0.02496516704559326, 0.1252705454826355, 0.27550625801086426, 0.425741970539093, 0.5759776830673218, 0.7262134552001953, 0.8764491081237793, 1.0266847610473633, 1.1769205331802368, 1.3271563053131104, 1.4773919582366943, 1.6276276111602783, 1.7778633832931519, 1.9280991554260254, 2.0783348083496094, 2.2285704612731934, 2.3788061141967773, 2.5290420055389404, 2.6792776584625244, 2.8295133113861084, 2.9797492027282715, 3.1299848556518555, 3.2802205085754395, 3.4304561614990234, 3.5806918144226074, 3.7309277057647705, 3.8811633586883545, 4.031399250030518, 4.181634902954102, 4.3318705558776855, 4.4821062088012695]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 5.0, 6.0, 11.0, 12.0, 28.0, 45.0, 67.0, 128.0, 233.0, 483.0, 954.0, 2349.0, 6205.0, 19068.0, 70910.0, 278839.0, 457058.0, 154811.0, 38938.0, 11451.0, 3979.0, 1544.0, 677.0, 346.0, 175.0, 98.0, 51.0, 25.0, 15.0, 15.0, 3.0, 7.0, 10.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.939453125, -2.842376708984375, -2.74530029296875, -2.648223876953125, -2.5511474609375, -2.454071044921875, -2.35699462890625, -2.259918212890625, -2.162841796875, -2.065765380859375, -1.96868896484375, -1.871612548828125, -1.7745361328125, -1.677459716796875, -1.58038330078125, -1.483306884765625, -1.38623046875, -1.289154052734375, -1.19207763671875, -1.095001220703125, -0.9979248046875, -0.900848388671875, -0.80377197265625, -0.706695556640625, -0.609619140625, -0.512542724609375, -0.41546630859375, -0.318389892578125, -0.2213134765625, -0.124237060546875, -0.02716064453125, 0.069915771484375, 0.1669921875, 0.264068603515625, 0.36114501953125, 0.458221435546875, 0.5552978515625, 0.652374267578125, 0.74945068359375, 0.846527099609375, 0.943603515625, 1.040679931640625, 1.13775634765625, 1.234832763671875, 1.3319091796875, 1.428985595703125, 1.52606201171875, 1.623138427734375, 1.72021484375, 1.817291259765625, 1.91436767578125, 2.011444091796875, 2.1085205078125, 2.205596923828125, 2.30267333984375, 2.399749755859375, 2.496826171875, 2.593902587890625, 2.69097900390625, 2.788055419921875, 2.8851318359375, 2.982208251953125, 3.07928466796875, 3.176361083984375, 3.2734375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 4.0, 12.0, 15.0, 15.0, 24.0, 32.0, 51.0, 73.0, 91.0, 97.0, 91.0, 94.0, 85.0, 88.0, 59.0, 49.0, 29.0, 23.0, 22.0, 14.0, 12.0, 4.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4013671875, -1.3430633544921875, -1.284759521484375, -1.2264556884765625, -1.16815185546875, -1.1098480224609375, -1.051544189453125, -0.9932403564453125, -0.9349365234375, -0.8766326904296875, -0.818328857421875, -0.7600250244140625, -0.70172119140625, -0.6434173583984375, -0.585113525390625, -0.5268096923828125, -0.468505859375, -0.4102020263671875, -0.351898193359375, -0.2935943603515625, -0.23529052734375, -0.1769866943359375, -0.118682861328125, -0.0603790283203125, -0.0020751953125, 0.0562286376953125, 0.114532470703125, 0.1728363037109375, 0.23114013671875, 0.2894439697265625, 0.347747802734375, 0.4060516357421875, 0.46435546875, 0.5226593017578125, 0.580963134765625, 0.6392669677734375, 0.69757080078125, 0.7558746337890625, 0.814178466796875, 0.8724822998046875, 0.9307861328125, 0.9890899658203125, 1.047393798828125, 1.1056976318359375, 1.16400146484375, 1.2223052978515625, 1.280609130859375, 1.3389129638671875, 1.397216796875, 1.4555206298828125, 1.513824462890625, 1.5721282958984375, 1.63043212890625, 1.6887359619140625, 1.747039794921875, 1.8053436279296875, 1.8636474609375, 1.9219512939453125, 1.980255126953125, 2.0385589599609375, 2.09686279296875, 2.1551666259765625, 2.213470458984375, 2.2717742919921875, 2.330078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 4.0, 15.0, 23.0, 30.0, 57.0, 87.0, 140.0, 278.0, 529.0, 1335.0, 4419.0, 27167.0, 404348.0, 564616.0, 37165.0, 5475.0, 1555.0, 592.0, 282.0, 158.0, 103.0, 62.0, 32.0, 24.0, 14.0, 7.0, 5.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8359375, -6.6409912109375, -6.446044921875, -6.2510986328125, -6.05615234375, -5.8612060546875, -5.666259765625, -5.4713134765625, -5.2763671875, -5.0814208984375, -4.886474609375, -4.6915283203125, -4.49658203125, -4.3016357421875, -4.106689453125, -3.9117431640625, -3.716796875, -3.5218505859375, -3.326904296875, -3.1319580078125, -2.93701171875, -2.7420654296875, -2.547119140625, -2.3521728515625, -2.1572265625, -1.9622802734375, -1.767333984375, -1.5723876953125, -1.37744140625, -1.1824951171875, -0.987548828125, -0.7926025390625, -0.59765625, -0.4027099609375, -0.207763671875, -0.0128173828125, 0.18212890625, 0.3770751953125, 0.572021484375, 0.7669677734375, 0.9619140625, 1.1568603515625, 1.351806640625, 1.5467529296875, 1.74169921875, 1.9366455078125, 2.131591796875, 2.3265380859375, 2.521484375, 2.7164306640625, 2.911376953125, 3.1063232421875, 3.30126953125, 3.4962158203125, 3.691162109375, 3.8861083984375, 4.0810546875, 4.2760009765625, 4.470947265625, 4.6658935546875, 4.86083984375, 5.0557861328125, 5.250732421875, 5.4456787109375, 5.640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 11.0, 10.0, 7.0, 14.0, 20.0, 15.0, 24.0, 40.0, 45.0, 39.0, 45.0, 71.0, 62.0, 64.0, 56.0, 61.0, 63.0, 47.0, 50.0, 48.0, 38.0, 34.0, 21.0, 23.0, 26.0, 16.0, 12.0, 9.0, 6.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.00390625, -5.79351806640625, -5.5831298828125, -5.37274169921875, -5.162353515625, -4.95196533203125, -4.7415771484375, -4.53118896484375, -4.32080078125, -4.11041259765625, -3.9000244140625, -3.68963623046875, -3.479248046875, -3.26885986328125, -3.0584716796875, -2.84808349609375, -2.6376953125, -2.42730712890625, -2.2169189453125, -2.00653076171875, -1.796142578125, -1.58575439453125, -1.3753662109375, -1.16497802734375, -0.95458984375, -0.74420166015625, -0.5338134765625, -0.32342529296875, -0.113037109375, 0.09735107421875, 0.3077392578125, 0.51812744140625, 0.728515625, 0.93890380859375, 1.1492919921875, 1.35968017578125, 1.570068359375, 1.78045654296875, 1.9908447265625, 2.20123291015625, 2.41162109375, 2.62200927734375, 2.8323974609375, 3.04278564453125, 3.253173828125, 3.46356201171875, 3.6739501953125, 3.88433837890625, 4.0947265625, 4.30511474609375, 4.5155029296875, 4.72589111328125, 4.936279296875, 5.14666748046875, 5.3570556640625, 5.56744384765625, 5.77783203125, 5.98822021484375, 6.1986083984375, 6.40899658203125, 6.619384765625, 6.82977294921875, 7.0401611328125, 7.25054931640625, 7.4609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 10.0, 9.0, 12.0, 28.0, 39.0, 54.0, 90.0, 197.0, 478.0, 1357.0, 7769.0, 307119.0, 715249.0, 13234.0, 1820.0, 593.0, 230.0, 97.0, 58.0, 40.0, 23.0, 13.0, 11.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.779296875, -3.665130615234375, -3.55096435546875, -3.436798095703125, -3.3226318359375, -3.208465576171875, -3.09429931640625, -2.980133056640625, -2.865966796875, -2.751800537109375, -2.63763427734375, -2.523468017578125, -2.4093017578125, -2.295135498046875, -2.18096923828125, -2.066802978515625, -1.95263671875, -1.838470458984375, -1.72430419921875, -1.610137939453125, -1.4959716796875, -1.381805419921875, -1.26763916015625, -1.153472900390625, -1.039306640625, -0.925140380859375, -0.81097412109375, -0.696807861328125, -0.5826416015625, -0.468475341796875, -0.35430908203125, -0.240142822265625, -0.1259765625, -0.011810302734375, 0.10235595703125, 0.216522216796875, 0.3306884765625, 0.444854736328125, 0.55902099609375, 0.673187255859375, 0.787353515625, 0.901519775390625, 1.01568603515625, 1.129852294921875, 1.2440185546875, 1.358184814453125, 1.47235107421875, 1.586517333984375, 1.70068359375, 1.814849853515625, 1.92901611328125, 2.043182373046875, 2.1573486328125, 2.271514892578125, 2.38568115234375, 2.499847412109375, 2.614013671875, 2.728179931640625, 2.84234619140625, 2.956512451171875, 3.0706787109375, 3.184844970703125, 3.29901123046875, 3.413177490234375, 3.52734375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 12.0, 10.0, 20.0, 31.0, 35.0, 36.0, 73.0, 82.0, 98.0, 113.0, 101.0, 83.0, 71.0, 50.0, 46.0, 42.0, 26.0, 15.0, 18.0, 13.0, 5.0, 2.0, 3.0, 3.0, 7.0, 3.0, 2.0], "bins": [-0.00048828125, -0.0004778541624546051, -0.0004674270749092102, -0.0004569999873638153, -0.0004465728998184204, -0.0004361458122730255, -0.0004257187247276306, -0.0004152916371822357, -0.0004048645496368408, -0.0003944374620914459, -0.000384010374546051, -0.00037358328700065613, -0.00036315619945526123, -0.00035272911190986633, -0.00034230202436447144, -0.00033187493681907654, -0.00032144784927368164, -0.00031102076172828674, -0.00030059367418289185, -0.00029016658663749695, -0.00027973949909210205, -0.00026931241154670715, -0.00025888532400131226, -0.00024845823645591736, -0.00023803114891052246, -0.00022760406136512756, -0.00021717697381973267, -0.00020674988627433777, -0.00019632279872894287, -0.00018589571118354797, -0.00017546862363815308, -0.00016504153609275818, -0.00015461444854736328, -0.00014418736100196838, -0.00013376027345657349, -0.0001233331859111786, -0.00011290609836578369, -0.0001024790108203888, -9.20519232749939e-05, -8.1624835729599e-05, -7.11977481842041e-05, -6.0770660638809204e-05, -5.034357309341431e-05, -3.991648554801941e-05, -2.9489398002624512e-05, -1.9062310457229614e-05, -8.635222911834717e-06, 1.7918646335601807e-06, 1.2218952178955078e-05, 2.2646039724349976e-05, 3.307312726974487e-05, 4.350021481513977e-05, 5.392730236053467e-05, 6.435438990592957e-05, 7.478147745132446e-05, 8.520856499671936e-05, 9.563565254211426e-05, 0.00010606274008750916, 0.00011648982763290405, 0.00012691691517829895, 0.00013734400272369385, 0.00014777109026908875, 0.00015819817781448364, 0.00016862526535987854, 0.00017905235290527344]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 8.0, 13.0, 20.0, 43.0, 71.0, 167.0, 358.0, 962.0, 3451.0, 26764.0, 718476.0, 282798.0, 12024.0, 2125.0, 687.0, 275.0, 142.0, 62.0, 36.0, 18.0, 7.0, 11.0, 3.0, 5.0, 5.0, 0.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.51171875, -2.42755126953125, -2.3433837890625, -2.25921630859375, -2.175048828125, -2.09088134765625, -2.0067138671875, -1.92254638671875, -1.83837890625, -1.75421142578125, -1.6700439453125, -1.58587646484375, -1.501708984375, -1.41754150390625, -1.3333740234375, -1.24920654296875, -1.1650390625, -1.08087158203125, -0.9967041015625, -0.91253662109375, -0.828369140625, -0.74420166015625, -0.6600341796875, -0.57586669921875, -0.49169921875, -0.40753173828125, -0.3233642578125, -0.23919677734375, -0.155029296875, -0.07086181640625, 0.0133056640625, 0.09747314453125, 0.181640625, 0.26580810546875, 0.3499755859375, 0.43414306640625, 0.518310546875, 0.60247802734375, 0.6866455078125, 0.77081298828125, 0.85498046875, 0.93914794921875, 1.0233154296875, 1.10748291015625, 1.191650390625, 1.27581787109375, 1.3599853515625, 1.44415283203125, 1.5283203125, 1.61248779296875, 1.6966552734375, 1.78082275390625, 1.864990234375, 1.94915771484375, 2.0333251953125, 2.11749267578125, 2.20166015625, 2.28582763671875, 2.3699951171875, 2.45416259765625, 2.538330078125, 2.62249755859375, 2.7066650390625, 2.79083251953125, 2.875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 6.0, 6.0, 15.0, 24.0, 34.0, 46.0, 99.0, 120.0, 145.0, 147.0, 126.0, 73.0, 68.0, 28.0, 30.0, 14.0, 11.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.439453125, -3.341064453125, -3.24267578125, -3.144287109375, -3.0458984375, -2.947509765625, -2.84912109375, -2.750732421875, -2.65234375, -2.553955078125, -2.45556640625, -2.357177734375, -2.2587890625, -2.160400390625, -2.06201171875, -1.963623046875, -1.865234375, -1.766845703125, -1.66845703125, -1.570068359375, -1.4716796875, -1.373291015625, -1.27490234375, -1.176513671875, -1.078125, -0.979736328125, -0.88134765625, -0.782958984375, -0.6845703125, -0.586181640625, -0.48779296875, -0.389404296875, -0.291015625, -0.192626953125, -0.09423828125, 0.004150390625, 0.1025390625, 0.200927734375, 0.29931640625, 0.397705078125, 0.49609375, 0.594482421875, 0.69287109375, 0.791259765625, 0.8896484375, 0.988037109375, 1.08642578125, 1.184814453125, 1.283203125, 1.381591796875, 1.47998046875, 1.578369140625, 1.6767578125, 1.775146484375, 1.87353515625, 1.971923828125, 2.0703125, 2.168701171875, 2.26708984375, 2.365478515625, 2.4638671875, 2.562255859375, 2.66064453125, 2.759033203125, 2.857421875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 10.0, 18.0, 24.0, 45.0, 52.0, 84.0, 105.0, 144.0, 150.0, 106.0, 84.0, 65.0, 38.0, 24.0, 14.0, 7.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.288166046142578, -22.266162872314453, -21.244159698486328, -20.222156524658203, -19.200153350830078, -18.178150177001953, -17.156147003173828, -16.134143829345703, -15.112140655517578, -14.090137481689453, -13.068134307861328, -12.046131134033203, -11.024127960205078, -10.002124786376953, -8.980121612548828, -7.958118438720703, -6.936115264892578, -5.914112091064453, -4.892108917236328, -3.870105743408203, -2.848102569580078, -1.8260993957519531, -0.8040962219238281, 0.21790695190429688, 1.2399101257324219, 2.261913299560547, 3.283916473388672, 4.305919647216797, 5.327922821044922, 6.349925994873047, 7.371929168701172, 8.393932342529297, 9.415931701660156, 10.437934875488281, 11.459938049316406, 12.481941223144531, 13.503944396972656, 14.525947570800781, 15.547950744628906, 16.56995391845703, 17.591957092285156, 18.61396026611328, 19.635963439941406, 20.65796661376953, 21.679969787597656, 22.70197296142578, 23.723976135253906, 24.74597930908203, 25.767982482910156, 26.78998565673828, 27.811988830566406, 28.83399200439453, 29.855995178222656, 30.87799835205078, 31.900001525878906, 32.92200469970703, 33.944007873535156, 34.96601104736328, 35.988014221191406, 37.01001739501953, 38.032020568847656, 39.05402374267578, 40.076026916503906, 41.09803009033203, 42.120033264160156]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 8.0, 4.0, 6.0, 4.0, 23.0, 22.0, 20.0, 35.0, 41.0, 37.0, 41.0, 70.0, 53.0, 66.0, 83.0, 73.0, 57.0, 58.0, 49.0, 54.0, 41.0, 40.0, 26.0, 17.0, 17.0, 17.0, 12.0, 15.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.04898452758789, -41.99481964111328, -40.94065856933594, -39.88649368286133, -38.83232879638672, -37.778167724609375, -36.724002838134766, -35.669837951660156, -34.61567687988281, -33.5615119934082, -32.50735092163086, -31.45318603515625, -30.399023056030273, -29.344860076904297, -28.290695190429688, -27.23653221130371, -26.1823673248291, -25.128204345703125, -24.074039459228516, -23.01987648010254, -21.965713500976562, -20.911548614501953, -19.857385635375977, -18.80322265625, -17.74905776977539, -16.694894790649414, -15.640730857849121, -14.586566925048828, -13.532403945922852, -12.478240013122559, -11.424076080322266, -10.369913101196289, -9.315750122070312, -8.26158618927002, -7.207423210144043, -6.15325927734375, -5.099095821380615, -4.0449323654174805, -2.9907684326171875, -1.9366049766540527, -0.882441520690918, 0.17172205448150635, 1.2258856296539307, 2.2800493240356445, 3.3342127799987793, 4.388376235961914, 5.442540168762207, 6.496703624725342, 7.550867080688477, 8.60503101348877, 9.659193992614746, 10.713357925415039, 11.767520904541016, 12.821684837341309, 13.875848770141602, 14.930011749267578, 15.984175682067871, 17.038339614868164, 18.09250259399414, 19.14666748046875, 20.200830459594727, 21.254993438720703, 22.309158325195312, 23.36332130432129, 24.417484283447266]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 3.0, 12.0, 10.0, 11.0, 19.0, 30.0, 29.0, 26.0, 33.0, 80.0, 124.0, 205.0, 417.0, 1140.0, 4761.0, 39581.0, 3667780.0, 456034.0, 19420.0, 3448.0, 741.0, 234.0, 79.0, 34.0, 11.0, 9.0, 4.0, 4.0], "bins": [-9.2421875, -9.067214965820312, -8.892242431640625, -8.717269897460938, -8.54229736328125, -8.367324829101562, -8.192352294921875, -8.017379760742188, -7.8424072265625, -7.6674346923828125, -7.492462158203125, -7.3174896240234375, -7.14251708984375, -6.9675445556640625, -6.792572021484375, -6.6175994873046875, -6.442626953125, -6.2676544189453125, -6.092681884765625, -5.9177093505859375, -5.74273681640625, -5.5677642822265625, -5.392791748046875, -5.2178192138671875, -5.0428466796875, -4.8678741455078125, -4.692901611328125, -4.5179290771484375, -4.34295654296875, -4.1679840087890625, -3.993011474609375, -3.8180389404296875, -3.64306640625, -3.4680938720703125, -3.293121337890625, -3.1181488037109375, -2.94317626953125, -2.7682037353515625, -2.593231201171875, -2.4182586669921875, -2.2432861328125, -2.0683135986328125, -1.893341064453125, -1.7183685302734375, -1.54339599609375, -1.3684234619140625, -1.193450927734375, -1.0184783935546875, -0.843505859375, -0.6685333251953125, -0.493560791015625, -0.3185882568359375, -0.14361572265625, 0.0313568115234375, 0.206329345703125, 0.3813018798828125, 0.5562744140625, 0.7312469482421875, 0.906219482421875, 1.0811920166015625, 1.25616455078125, 1.4311370849609375, 1.606109619140625, 1.7810821533203125, 1.9560546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 18.0, 30.0, 74.0, 124.0, 161.0, 162.0, 135.0, 118.0, 80.0, 40.0, 20.0, 18.0, 12.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.79296875, -4.698089599609375, -4.60321044921875, -4.508331298828125, -4.4134521484375, -4.318572998046875, -4.22369384765625, -4.128814697265625, -4.033935546875, -3.939056396484375, -3.84417724609375, -3.749298095703125, -3.6544189453125, -3.559539794921875, -3.46466064453125, -3.369781494140625, -3.27490234375, -3.180023193359375, -3.08514404296875, -2.990264892578125, -2.8953857421875, -2.800506591796875, -2.70562744140625, -2.610748291015625, -2.515869140625, -2.420989990234375, -2.32611083984375, -2.231231689453125, -2.1363525390625, -2.041473388671875, -1.94659423828125, -1.851715087890625, -1.7568359375, -1.661956787109375, -1.56707763671875, -1.472198486328125, -1.3773193359375, -1.282440185546875, -1.18756103515625, -1.092681884765625, -0.997802734375, -0.902923583984375, -0.80804443359375, -0.713165283203125, -0.6182861328125, -0.523406982421875, -0.42852783203125, -0.333648681640625, -0.23876953125, -0.143890380859375, -0.04901123046875, 0.045867919921875, 0.1407470703125, 0.235626220703125, 0.33050537109375, 0.425384521484375, 0.520263671875, 0.615142822265625, 0.71002197265625, 0.804901123046875, 0.8997802734375, 0.994659423828125, 1.08953857421875, 1.184417724609375, 1.279296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 7.0, 19.0, 18.0, 23.0, 35.0, 66.0, 85.0, 156.0, 234.0, 410.0, 740.0, 1443.0, 3105.0, 7946.0, 25835.0, 122235.0, 2858786.0, 1062536.0, 80266.0, 18895.0, 6227.0, 2445.0, 1240.0, 662.0, 308.0, 204.0, 96.0, 77.0, 48.0, 31.0, 15.0, 14.0, 9.0, 13.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.421875, -3.314544677734375, -3.20721435546875, -3.099884033203125, -2.9925537109375, -2.885223388671875, -2.77789306640625, -2.670562744140625, -2.563232421875, -2.455902099609375, -2.34857177734375, -2.241241455078125, -2.1339111328125, -2.026580810546875, -1.91925048828125, -1.811920166015625, -1.70458984375, -1.597259521484375, -1.48992919921875, -1.382598876953125, -1.2752685546875, -1.167938232421875, -1.06060791015625, -0.953277587890625, -0.845947265625, -0.738616943359375, -0.63128662109375, -0.523956298828125, -0.4166259765625, -0.309295654296875, -0.20196533203125, -0.094635009765625, 0.0126953125, 0.120025634765625, 0.22735595703125, 0.334686279296875, 0.4420166015625, 0.549346923828125, 0.65667724609375, 0.764007568359375, 0.871337890625, 0.978668212890625, 1.08599853515625, 1.193328857421875, 1.3006591796875, 1.407989501953125, 1.51531982421875, 1.622650146484375, 1.72998046875, 1.837310791015625, 1.94464111328125, 2.051971435546875, 2.1593017578125, 2.266632080078125, 2.37396240234375, 2.481292724609375, 2.588623046875, 2.695953369140625, 2.80328369140625, 2.910614013671875, 3.0179443359375, 3.125274658203125, 3.23260498046875, 3.339935302734375, 3.447265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 9.0, 3.0, 5.0, 9.0, 20.0, 19.0, 32.0, 48.0, 75.0, 140.0, 292.0, 878.0, 1313.0, 648.0, 219.0, 133.0, 75.0, 48.0, 35.0, 28.0, 13.0, 6.0, 12.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.3680419921875, -5.216552734375, -5.0650634765625, -4.91357421875, -4.7620849609375, -4.610595703125, -4.4591064453125, -4.3076171875, -4.1561279296875, -4.004638671875, -3.8531494140625, -3.70166015625, -3.5501708984375, -3.398681640625, -3.2471923828125, -3.095703125, -2.9442138671875, -2.792724609375, -2.6412353515625, -2.48974609375, -2.3382568359375, -2.186767578125, -2.0352783203125, -1.8837890625, -1.7322998046875, -1.580810546875, -1.4293212890625, -1.27783203125, -1.1263427734375, -0.974853515625, -0.8233642578125, -0.671875, -0.5203857421875, -0.368896484375, -0.2174072265625, -0.06591796875, 0.0855712890625, 0.237060546875, 0.3885498046875, 0.5400390625, 0.6915283203125, 0.843017578125, 0.9945068359375, 1.14599609375, 1.2974853515625, 1.448974609375, 1.6004638671875, 1.751953125, 1.9034423828125, 2.054931640625, 2.2064208984375, 2.35791015625, 2.5093994140625, 2.660888671875, 2.8123779296875, 2.9638671875, 3.1153564453125, 3.266845703125, 3.4183349609375, 3.56982421875, 3.7213134765625, 3.872802734375, 4.0242919921875, 4.17578125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 10.0, 18.0, 39.0, 48.0, 88.0, 109.0, 158.0, 167.0, 143.0, 85.0, 47.0, 30.0, 16.0, 12.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.949365615844727, -24.043842315673828, -23.138317108154297, -22.2327938079834, -21.327268600463867, -20.42174530029297, -19.516220092773438, -18.61069679260254, -17.70517349243164, -16.799650192260742, -15.894124984741211, -14.988601684570312, -14.083076477050781, -13.177553176879883, -12.272028923034668, -11.366504669189453, -10.460979461669922, -9.555455207824707, -8.649930953979492, -7.7444071769714355, -6.838882923126221, -5.933358669281006, -5.027834892272949, -4.122310638427734, -3.2167863845825195, -2.3112621307373047, -1.405738115310669, -0.5002140998840332, 0.40531015396118164, 1.3108344078063965, 2.216358184814453, 3.121882438659668, 4.02740478515625, 4.932929039001465, 5.83845329284668, 6.743977069854736, 7.649501323699951, 8.555025100708008, 9.460549354553223, 10.366073608398438, 11.271597862243652, 12.177122116088867, 13.082646369934082, 13.988170623779297, 14.893693923950195, 15.799219131469727, 16.704742431640625, 17.610267639160156, 18.515790939331055, 19.421314239501953, 20.326839447021484, 21.232362747192383, 22.137887954711914, 23.043411254882812, 23.948936462402344, 24.854459762573242, 25.75998306274414, 26.66550636291504, 27.57103157043457, 28.47655487060547, 29.382080078125, 30.2876033782959, 31.193126678466797, 32.09865188598633, 33.00417709350586]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 8.0, 17.0, 9.0, 25.0, 35.0, 27.0, 45.0, 52.0, 67.0, 73.0, 79.0, 78.0, 70.0, 72.0, 70.0, 66.0, 52.0, 40.0, 29.0, 32.0, 19.0, 14.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.357948303222656, -16.51941680908203, -15.68088436126709, -14.842352867126465, -14.003820419311523, -13.165288925170898, -12.326757431030273, -11.488224983215332, -10.64969253540039, -9.811161041259766, -8.972628593444824, -8.1340970993042, -7.295564651489258, -6.457033157348633, -5.61850118637085, -4.779969215393066, -3.9414377212524414, -3.102905750274658, -2.264373779296875, -1.425842046737671, -0.5873100757598877, 0.2512216567993164, 1.0897536277770996, 1.9282855987548828, 2.766817569732666, 3.605349540710449, 4.443881511688232, 5.282413482666016, 6.120944976806641, 6.959476947784424, 7.798008918762207, 8.636541366577148, 9.475072860717773, 10.313604354858398, 11.15213680267334, 11.990668296813965, 12.829200744628906, 13.667732238769531, 14.506263732910156, 15.344796180725098, 16.18332862854004, 17.021860122680664, 17.86039161682129, 18.698925018310547, 19.537456512451172, 20.375988006591797, 21.214519500732422, 22.053050994873047, 22.891582489013672, 23.730113983154297, 24.568645477294922, 25.40717887878418, 26.245710372924805, 27.08424186706543, 27.922773361206055, 28.761306762695312, 29.599838256835938, 30.438369750976562, 31.276901245117188, 32.11543273925781, 32.95396423339844, 33.79249572753906, 34.63103103637695, 35.46956253051758, 36.3080940246582]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 10.0, 14.0, 21.0, 32.0, 68.0, 94.0, 200.0, 347.0, 773.0, 1685.0, 4210.0, 12335.0, 40486.0, 142520.0, 420188.0, 301727.0, 85617.0, 24863.0, 7997.0, 2886.0, 1271.0, 591.0, 282.0, 134.0, 83.0, 46.0, 23.0, 13.0, 11.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.255859375, -2.17169189453125, -2.0875244140625, -2.00335693359375, -1.919189453125, -1.83502197265625, -1.7508544921875, -1.66668701171875, -1.58251953125, -1.49835205078125, -1.4141845703125, -1.33001708984375, -1.245849609375, -1.16168212890625, -1.0775146484375, -0.99334716796875, -0.9091796875, -0.82501220703125, -0.7408447265625, -0.65667724609375, -0.572509765625, -0.48834228515625, -0.4041748046875, -0.32000732421875, -0.23583984375, -0.15167236328125, -0.0675048828125, 0.01666259765625, 0.100830078125, 0.18499755859375, 0.2691650390625, 0.35333251953125, 0.4375, 0.52166748046875, 0.6058349609375, 0.69000244140625, 0.774169921875, 0.85833740234375, 0.9425048828125, 1.02667236328125, 1.11083984375, 1.19500732421875, 1.2791748046875, 1.36334228515625, 1.447509765625, 1.53167724609375, 1.6158447265625, 1.70001220703125, 1.7841796875, 1.86834716796875, 1.9525146484375, 2.03668212890625, 2.120849609375, 2.20501708984375, 2.2891845703125, 2.37335205078125, 2.45751953125, 2.54168701171875, 2.6258544921875, 2.71002197265625, 2.794189453125, 2.87835693359375, 2.9625244140625, 3.04669189453125, 3.130859375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 10.0, 19.0, 18.0, 30.0, 35.0, 51.0, 57.0, 70.0, 81.0, 95.0, 72.0, 77.0, 82.0, 57.0, 47.0, 42.0, 51.0, 32.0, 17.0, 14.0, 13.0, 8.0, 5.0, 1.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.185546875, -2.1351776123046875, -2.084808349609375, -2.0344390869140625, -1.98406982421875, -1.9337005615234375, -1.883331298828125, -1.8329620361328125, -1.7825927734375, -1.7322235107421875, -1.681854248046875, -1.6314849853515625, -1.58111572265625, -1.5307464599609375, -1.480377197265625, -1.4300079345703125, -1.379638671875, -1.3292694091796875, -1.278900146484375, -1.2285308837890625, -1.17816162109375, -1.1277923583984375, -1.077423095703125, -1.0270538330078125, -0.9766845703125, -0.9263153076171875, -0.875946044921875, -0.8255767822265625, -0.77520751953125, -0.7248382568359375, -0.674468994140625, -0.6240997314453125, -0.57373046875, -0.5233612060546875, -0.472991943359375, -0.4226226806640625, -0.37225341796875, -0.3218841552734375, -0.271514892578125, -0.2211456298828125, -0.1707763671875, -0.1204071044921875, -0.070037841796875, -0.0196685791015625, 0.03070068359375, 0.0810699462890625, 0.131439208984375, 0.1818084716796875, 0.232177734375, 0.2825469970703125, 0.332916259765625, 0.3832855224609375, 0.43365478515625, 0.4840240478515625, 0.534393310546875, 0.5847625732421875, 0.6351318359375, 0.6855010986328125, 0.735870361328125, 0.7862396240234375, 0.83660888671875, 0.8869781494140625, 0.937347412109375, 0.9877166748046875, 1.0380859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 5.0, 6.0, 9.0, 5.0, 19.0, 11.0, 36.0, 44.0, 71.0, 109.0, 192.0, 296.0, 480.0, 900.0, 1733.0, 4454.0, 16596.0, 98496.0, 613986.0, 260254.0, 37232.0, 8168.0, 2659.0, 1217.0, 580.0, 359.0, 223.0, 147.0, 87.0, 75.0, 37.0, 25.0, 13.0, 14.0, 5.0, 5.0, 5.0, 6.0, 0.0, 3.0, 1.0, 1.0], "bins": [-4.9375, -4.816314697265625, -4.69512939453125, -4.573944091796875, -4.4527587890625, -4.331573486328125, -4.21038818359375, -4.089202880859375, -3.968017578125, -3.846832275390625, -3.72564697265625, -3.604461669921875, -3.4832763671875, -3.362091064453125, -3.24090576171875, -3.119720458984375, -2.99853515625, -2.877349853515625, -2.75616455078125, -2.634979248046875, -2.5137939453125, -2.392608642578125, -2.27142333984375, -2.150238037109375, -2.029052734375, -1.907867431640625, -1.78668212890625, -1.665496826171875, -1.5443115234375, -1.423126220703125, -1.30194091796875, -1.180755615234375, -1.0595703125, -0.938385009765625, -0.81719970703125, -0.696014404296875, -0.5748291015625, -0.453643798828125, -0.33245849609375, -0.211273193359375, -0.090087890625, 0.031097412109375, 0.15228271484375, 0.273468017578125, 0.3946533203125, 0.515838623046875, 0.63702392578125, 0.758209228515625, 0.87939453125, 1.000579833984375, 1.12176513671875, 1.242950439453125, 1.3641357421875, 1.485321044921875, 1.60650634765625, 1.727691650390625, 1.848876953125, 1.970062255859375, 2.09124755859375, 2.212432861328125, 2.3336181640625, 2.454803466796875, 2.57598876953125, 2.697174072265625, 2.818359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 4.0, 9.0, 4.0, 12.0, 11.0, 17.0, 23.0, 32.0, 26.0, 22.0, 27.0, 41.0, 39.0, 37.0, 46.0, 47.0, 36.0, 54.0, 45.0, 44.0, 49.0, 44.0, 45.0, 43.0, 39.0, 24.0, 31.0, 24.0, 13.0, 20.0, 14.0, 10.0, 9.0, 19.0, 8.0, 9.0, 13.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.10546875, -4.948486328125, -4.79150390625, -4.634521484375, -4.4775390625, -4.320556640625, -4.16357421875, -4.006591796875, -3.849609375, -3.692626953125, -3.53564453125, -3.378662109375, -3.2216796875, -3.064697265625, -2.90771484375, -2.750732421875, -2.59375, -2.436767578125, -2.27978515625, -2.122802734375, -1.9658203125, -1.808837890625, -1.65185546875, -1.494873046875, -1.337890625, -1.180908203125, -1.02392578125, -0.866943359375, -0.7099609375, -0.552978515625, -0.39599609375, -0.239013671875, -0.08203125, 0.074951171875, 0.23193359375, 0.388916015625, 0.5458984375, 0.702880859375, 0.85986328125, 1.016845703125, 1.173828125, 1.330810546875, 1.48779296875, 1.644775390625, 1.8017578125, 1.958740234375, 2.11572265625, 2.272705078125, 2.4296875, 2.586669921875, 2.74365234375, 2.900634765625, 3.0576171875, 3.214599609375, 3.37158203125, 3.528564453125, 3.685546875, 3.842529296875, 3.99951171875, 4.156494140625, 4.3134765625, 4.470458984375, 4.62744140625, 4.784423828125, 4.94140625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 16.0, 26.0, 38.0, 75.0, 147.0, 409.0, 1316.0, 7854.0, 224487.0, 791732.0, 19228.0, 2239.0, 568.0, 201.0, 109.0, 48.0, 26.0, 18.0, 10.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.228515625, -3.134033203125, -3.03955078125, -2.945068359375, -2.8505859375, -2.756103515625, -2.66162109375, -2.567138671875, -2.47265625, -2.378173828125, -2.28369140625, -2.189208984375, -2.0947265625, -2.000244140625, -1.90576171875, -1.811279296875, -1.716796875, -1.622314453125, -1.52783203125, -1.433349609375, -1.3388671875, -1.244384765625, -1.14990234375, -1.055419921875, -0.9609375, -0.866455078125, -0.77197265625, -0.677490234375, -0.5830078125, -0.488525390625, -0.39404296875, -0.299560546875, -0.205078125, -0.110595703125, -0.01611328125, 0.078369140625, 0.1728515625, 0.267333984375, 0.36181640625, 0.456298828125, 0.55078125, 0.645263671875, 0.73974609375, 0.834228515625, 0.9287109375, 1.023193359375, 1.11767578125, 1.212158203125, 1.306640625, 1.401123046875, 1.49560546875, 1.590087890625, 1.6845703125, 1.779052734375, 1.87353515625, 1.968017578125, 2.0625, 2.156982421875, 2.25146484375, 2.345947265625, 2.4404296875, 2.534912109375, 2.62939453125, 2.723876953125, 2.818359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 10.0, 10.0, 11.0, 26.0, 31.0, 45.0, 51.0, 84.0, 96.0, 122.0, 139.0, 107.0, 77.0, 67.0, 41.0, 26.0, 23.0, 12.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032973289489746094, -0.00031743571162223816, -0.0003051385283470154, -0.0002928413450717926, -0.0002805441617965698, -0.00026824697852134705, -0.00025594979524612427, -0.0002436526119709015, -0.0002313554286956787, -0.00021905824542045593, -0.00020676106214523315, -0.00019446387887001038, -0.0001821666955947876, -0.00016986951231956482, -0.00015757232904434204, -0.00014527514576911926, -0.00013297796249389648, -0.0001206807792186737, -0.00010838359594345093, -9.608641266822815e-05, -8.378922939300537e-05, -7.149204611778259e-05, -5.9194862842559814e-05, -4.6897679567337036e-05, -3.460049629211426e-05, -2.230331301689148e-05, -1.0006129741668701e-05, 2.291053533554077e-06, 1.4588236808776855e-05, 2.6885420083999634e-05, 3.918260335922241e-05, 5.147978663444519e-05, 6.377696990966797e-05, 7.607415318489075e-05, 8.837133646011353e-05, 0.0001006685197353363, 0.00011296570301055908, 0.00012526288628578186, 0.00013756006956100464, 0.00014985725283622742, 0.0001621544361114502, 0.00017445161938667297, 0.00018674880266189575, 0.00019904598593711853, 0.0002113431692123413, 0.0002236403524875641, 0.00023593753576278687, 0.00024823471903800964, 0.0002605319023132324, 0.0002728290855884552, 0.000285126268863678, 0.00029742345213890076, 0.00030972063541412354, 0.0003220178186893463, 0.0003343150019645691, 0.00034661218523979187, 0.00035890936851501465, 0.0003712065517902374, 0.0003835037350654602, 0.000395800918340683, 0.00040809810161590576, 0.00042039528489112854, 0.0004326924681663513, 0.0004449896514415741, 0.0004572868347167969]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 13.0, 16.0, 22.0, 25.0, 33.0, 57.0, 60.0, 96.0, 154.0, 280.0, 493.0, 957.0, 2186.0, 6016.0, 23372.0, 148457.0, 667881.0, 162650.0, 24812.0, 6411.0, 2339.0, 973.0, 504.0, 278.0, 165.0, 97.0, 60.0, 32.0, 32.0, 17.0, 13.0, 11.0, 7.0, 11.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.25, -1.20904541015625, -1.1680908203125, -1.12713623046875, -1.086181640625, -1.04522705078125, -1.0042724609375, -0.96331787109375, -0.92236328125, -0.88140869140625, -0.8404541015625, -0.79949951171875, -0.758544921875, -0.71759033203125, -0.6766357421875, -0.63568115234375, -0.5947265625, -0.55377197265625, -0.5128173828125, -0.47186279296875, -0.430908203125, -0.38995361328125, -0.3489990234375, -0.30804443359375, -0.26708984375, -0.22613525390625, -0.1851806640625, -0.14422607421875, -0.103271484375, -0.06231689453125, -0.0213623046875, 0.01959228515625, 0.060546875, 0.10150146484375, 0.1424560546875, 0.18341064453125, 0.224365234375, 0.26531982421875, 0.3062744140625, 0.34722900390625, 0.38818359375, 0.42913818359375, 0.4700927734375, 0.51104736328125, 0.552001953125, 0.59295654296875, 0.6339111328125, 0.67486572265625, 0.7158203125, 0.75677490234375, 0.7977294921875, 0.83868408203125, 0.879638671875, 0.92059326171875, 0.9615478515625, 1.00250244140625, 1.04345703125, 1.08441162109375, 1.1253662109375, 1.16632080078125, 1.207275390625, 1.24822998046875, 1.2891845703125, 1.33013916015625, 1.37109375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 6.0, 6.0, 7.0, 8.0, 15.0, 15.0, 28.0, 32.0, 43.0, 45.0, 51.0, 63.0, 87.0, 93.0, 75.0, 103.0, 71.0, 61.0, 44.0, 38.0, 33.0, 26.0, 18.0, 13.0, 8.0, 5.0, 4.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.12109375, -1.0718994140625, -1.022705078125, -0.9735107421875, -0.92431640625, -0.8751220703125, -0.825927734375, -0.7767333984375, -0.7275390625, -0.6783447265625, -0.629150390625, -0.5799560546875, -0.53076171875, -0.4815673828125, -0.432373046875, -0.3831787109375, -0.333984375, -0.2847900390625, -0.235595703125, -0.1864013671875, -0.13720703125, -0.0880126953125, -0.038818359375, 0.0103759765625, 0.0595703125, 0.1087646484375, 0.157958984375, 0.2071533203125, 0.25634765625, 0.3055419921875, 0.354736328125, 0.4039306640625, 0.453125, 0.5023193359375, 0.551513671875, 0.6007080078125, 0.64990234375, 0.6990966796875, 0.748291015625, 0.7974853515625, 0.8466796875, 0.8958740234375, 0.945068359375, 0.9942626953125, 1.04345703125, 1.0926513671875, 1.141845703125, 1.1910400390625, 1.240234375, 1.2894287109375, 1.338623046875, 1.3878173828125, 1.43701171875, 1.4862060546875, 1.535400390625, 1.5845947265625, 1.6337890625, 1.6829833984375, 1.732177734375, 1.7813720703125, 1.83056640625, 1.8797607421875, 1.928955078125, 1.9781494140625, 2.02734375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 8.0, 2.0, 16.0, 49.0, 126.0, 236.0, 284.0, 160.0, 77.0, 23.0, 9.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.383113861083984, -23.91530990600586, -22.447507858276367, -20.979703903198242, -19.51190185546875, -18.044097900390625, -16.5762939453125, -15.108490943908691, -13.640687942504883, -12.172884941101074, -10.705081939697266, -9.23727798461914, -7.769474983215332, -6.301671981811523, -4.833868026733398, -3.36606502532959, -1.8982620239257812, -0.43045878410339355, 1.0373444557189941, 2.505147933959961, 3.9729509353637695, 5.440753936767578, 6.908557891845703, 8.376360893249512, 9.84416389465332, 11.311966896057129, 12.779769897460938, 14.247573852539062, 15.715376853942871, 17.18317985534668, 18.650983810424805, 20.118785858154297, 21.586585998535156, 23.05438995361328, 24.522192001342773, 25.9899959564209, 27.45779800415039, 28.925601959228516, 30.39340591430664, 31.861209869384766, 33.329010009765625, 34.79681396484375, 36.264617919921875, 37.732421875, 39.20022201538086, 40.668025970458984, 42.13582992553711, 43.603633880615234, 45.07143783569336, 46.539241790771484, 48.00704574584961, 49.47484588623047, 50.942649841308594, 52.41045379638672, 53.878257751464844, 55.34606170654297, 56.813865661621094, 58.28166961669922, 59.749473571777344, 61.21727752685547, 62.68507766723633, 64.15287780761719, 65.62068176269531, 67.08848571777344, 68.55628967285156]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 9.0, 7.0, 9.0, 10.0, 16.0, 14.0, 22.0, 27.0, 30.0, 39.0, 47.0, 56.0, 34.0, 51.0, 56.0, 71.0, 68.0, 68.0, 58.0, 39.0, 46.0, 40.0, 27.0, 22.0, 26.0, 24.0, 20.0, 10.0, 8.0, 11.0, 6.0, 11.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.10374641418457, -19.4123477935791, -18.720947265625, -18.02954864501953, -17.338150024414062, -16.646751403808594, -15.955351829528809, -15.263952255249023, -14.572553634643555, -13.881155014038086, -13.1897554397583, -12.498355865478516, -11.806957244873047, -11.115558624267578, -10.424159049987793, -9.732759475708008, -9.041360855102539, -8.34996223449707, -7.658562660217285, -6.967163562774658, -6.275764465332031, -5.584365367889404, -4.892966270446777, -4.20156717300415, -3.5101680755615234, -2.8187689781188965, -2.1273698806762695, -1.4359707832336426, -0.7445716857910156, -0.05317258834838867, 0.6382265090942383, 1.3296256065368652, 2.021026611328125, 2.712425708770752, 3.403824806213379, 4.095223903656006, 4.786623001098633, 5.47802209854126, 6.169421195983887, 6.860820293426514, 7.552219390869141, 8.24361801147461, 8.935017585754395, 9.62641716003418, 10.317815780639648, 11.009214401245117, 11.700613975524902, 12.392013549804688, 13.083412170410156, 13.774810791015625, 14.46621036529541, 15.157609939575195, 15.849008560180664, 16.540407180786133, 17.231807708740234, 17.923206329345703, 18.614604949951172, 19.30600357055664, 19.99740219116211, 20.68880271911621, 21.38020133972168, 22.07159996032715, 22.76300048828125, 23.45439910888672, 24.145797729492188]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 9.0, 15.0, 11.0, 42.0, 71.0, 118.0, 263.0, 788.0, 3068.0, 17658.0, 298147.0, 3796124.0, 66874.0, 8112.0, 1827.0, 581.0, 239.0, 143.0, 61.0, 46.0, 23.0, 9.0, 13.0, 6.0, 9.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.92578125, -4.800445556640625, -4.67510986328125, -4.549774169921875, -4.4244384765625, -4.299102783203125, -4.17376708984375, -4.048431396484375, -3.923095703125, -3.797760009765625, -3.67242431640625, -3.547088623046875, -3.4217529296875, -3.296417236328125, -3.17108154296875, -3.045745849609375, -2.92041015625, -2.795074462890625, -2.66973876953125, -2.544403076171875, -2.4190673828125, -2.293731689453125, -2.16839599609375, -2.043060302734375, -1.917724609375, -1.792388916015625, -1.66705322265625, -1.541717529296875, -1.4163818359375, -1.291046142578125, -1.16571044921875, -1.040374755859375, -0.9150390625, -0.789703369140625, -0.66436767578125, -0.539031982421875, -0.4136962890625, -0.288360595703125, -0.16302490234375, -0.037689208984375, 0.087646484375, 0.212982177734375, 0.33831787109375, 0.463653564453125, 0.5889892578125, 0.714324951171875, 0.83966064453125, 0.964996337890625, 1.09033203125, 1.215667724609375, 1.34100341796875, 1.466339111328125, 1.5916748046875, 1.717010498046875, 1.84234619140625, 1.967681884765625, 2.093017578125, 2.218353271484375, 2.34368896484375, 2.469024658203125, 2.5943603515625, 2.719696044921875, 2.84503173828125, 2.970367431640625, 3.095703125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 4.0, 11.0, 12.0, 13.0, 25.0, 22.0, 46.0, 66.0, 62.0, 75.0, 75.0, 73.0, 76.0, 80.0, 79.0, 71.0, 45.0, 45.0, 34.0, 35.0, 16.0, 13.0, 7.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77734375, -0.72998046875, -0.6826171875, -0.63525390625, -0.587890625, -0.54052734375, -0.4931640625, -0.44580078125, -0.3984375, -0.35107421875, -0.3037109375, -0.25634765625, -0.208984375, -0.16162109375, -0.1142578125, -0.06689453125, -0.01953125, 0.02783203125, 0.0751953125, 0.12255859375, 0.169921875, 0.21728515625, 0.2646484375, 0.31201171875, 0.359375, 0.40673828125, 0.4541015625, 0.50146484375, 0.548828125, 0.59619140625, 0.6435546875, 0.69091796875, 0.73828125, 0.78564453125, 0.8330078125, 0.88037109375, 0.927734375, 0.97509765625, 1.0224609375, 1.06982421875, 1.1171875, 1.16455078125, 1.2119140625, 1.25927734375, 1.306640625, 1.35400390625, 1.4013671875, 1.44873046875, 1.49609375, 1.54345703125, 1.5908203125, 1.63818359375, 1.685546875, 1.73291015625, 1.7802734375, 1.82763671875, 1.875, 1.92236328125, 1.9697265625, 2.01708984375, 2.064453125, 2.11181640625, 2.1591796875, 2.20654296875, 2.25390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 4.0, 17.0, 19.0, 45.0, 57.0, 98.0, 227.0, 376.0, 895.0, 2244.0, 6189.0, 19964.0, 92019.0, 1591393.0, 2333780.0, 112368.0, 23228.0, 6989.0, 2459.0, 1011.0, 446.0, 199.0, 118.0, 52.0, 27.0, 26.0, 9.0, 10.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.935546875, -2.849334716796875, -2.76312255859375, -2.676910400390625, -2.5906982421875, -2.504486083984375, -2.41827392578125, -2.332061767578125, -2.245849609375, -2.159637451171875, -2.07342529296875, -1.987213134765625, -1.9010009765625, -1.814788818359375, -1.72857666015625, -1.642364501953125, -1.55615234375, -1.469940185546875, -1.38372802734375, -1.297515869140625, -1.2113037109375, -1.125091552734375, -1.03887939453125, -0.952667236328125, -0.866455078125, -0.780242919921875, -0.69403076171875, -0.607818603515625, -0.5216064453125, -0.435394287109375, -0.34918212890625, -0.262969970703125, -0.1767578125, -0.090545654296875, -0.00433349609375, 0.081878662109375, 0.1680908203125, 0.254302978515625, 0.34051513671875, 0.426727294921875, 0.512939453125, 0.599151611328125, 0.68536376953125, 0.771575927734375, 0.8577880859375, 0.944000244140625, 1.03021240234375, 1.116424560546875, 1.20263671875, 1.288848876953125, 1.37506103515625, 1.461273193359375, 1.5474853515625, 1.633697509765625, 1.71990966796875, 1.806121826171875, 1.892333984375, 1.978546142578125, 2.06475830078125, 2.150970458984375, 2.2371826171875, 2.323394775390625, 2.40960693359375, 2.495819091796875, 2.58203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 9.0, 7.0, 8.0, 9.0, 17.0, 17.0, 33.0, 43.0, 53.0, 104.0, 184.0, 316.0, 612.0, 992.0, 738.0, 378.0, 181.0, 112.0, 74.0, 57.0, 37.0, 22.0, 16.0, 12.0, 10.0, 9.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.12109375, -3.035797119140625, -2.95050048828125, -2.865203857421875, -2.7799072265625, -2.694610595703125, -2.60931396484375, -2.524017333984375, -2.438720703125, -2.353424072265625, -2.26812744140625, -2.182830810546875, -2.0975341796875, -2.012237548828125, -1.92694091796875, -1.841644287109375, -1.75634765625, -1.671051025390625, -1.58575439453125, -1.500457763671875, -1.4151611328125, -1.329864501953125, -1.24456787109375, -1.159271240234375, -1.073974609375, -0.988677978515625, -0.90338134765625, -0.818084716796875, -0.7327880859375, -0.647491455078125, -0.56219482421875, -0.476898193359375, -0.3916015625, -0.306304931640625, -0.22100830078125, -0.135711669921875, -0.0504150390625, 0.034881591796875, 0.12017822265625, 0.205474853515625, 0.290771484375, 0.376068115234375, 0.46136474609375, 0.546661376953125, 0.6319580078125, 0.717254638671875, 0.80255126953125, 0.887847900390625, 0.97314453125, 1.058441162109375, 1.14373779296875, 1.229034423828125, 1.3143310546875, 1.399627685546875, 1.48492431640625, 1.570220947265625, 1.655517578125, 1.740814208984375, 1.82611083984375, 1.911407470703125, 1.9967041015625, 2.082000732421875, 2.16729736328125, 2.252593994140625, 2.337890625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 15.0, 37.0, 80.0, 158.0, 218.0, 187.0, 139.0, 75.0, 37.0, 11.0, 15.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.884531021118164, -21.070728302001953, -20.256927490234375, -19.443124771118164, -18.629322052001953, -17.815521240234375, -17.001718521118164, -16.187915802001953, -15.374114990234375, -14.56031322479248, -13.746511459350586, -12.932708740234375, -12.11890697479248, -11.305105209350586, -10.491302490234375, -9.67750072479248, -8.863698959350586, -8.049897193908691, -7.236094951629639, -6.422292709350586, -5.608490943908691, -4.794689178466797, -3.980886936187744, -3.1670846939086914, -2.353282928466797, -1.5394809246063232, -0.7256789207458496, 0.08812308311462402, 0.9019250869750977, 1.7157268524169922, 2.529529094696045, 3.3433313369750977, 4.157131195068359, 4.970932960510254, 5.784735202789307, 6.598537445068359, 7.412339210510254, 8.226140975952148, 9.03994369506836, 9.853745460510254, 10.667547225952148, 11.481348991394043, 12.295150756835938, 13.108953475952148, 13.922755241394043, 14.736557006835938, 15.550359725952148, 16.36416244506836, 17.177963256835938, 17.99176597595215, 18.805566787719727, 19.619369506835938, 20.433170318603516, 21.246973037719727, 22.060775756835938, 22.874576568603516, 23.688379287719727, 24.502182006835938, 25.315982818603516, 26.129785537719727, 26.943588256835938, 27.757389068603516, 28.571191787719727, 29.384994506835938, 30.198795318603516]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 10.0, 4.0, 2.0, 8.0, 9.0, 14.0, 17.0, 17.0, 14.0, 29.0, 22.0, 23.0, 35.0, 32.0, 34.0, 36.0, 34.0, 38.0, 55.0, 56.0, 38.0, 47.0, 45.0, 44.0, 46.0, 42.0, 44.0, 32.0, 22.0, 22.0, 25.0, 20.0, 16.0, 15.0, 14.0, 10.0, 4.0, 8.0, 3.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.633718490600586, -11.298864364624023, -10.964011192321777, -10.629157066345215, -10.294302940368652, -9.959449768066406, -9.624595642089844, -9.289741516113281, -8.954887390136719, -8.620033264160156, -8.28518009185791, -7.950325965881348, -7.615471839904785, -7.280618190765381, -6.945764541625977, -6.610910415649414, -6.276057243347168, -5.941203594207764, -5.606349468231201, -5.271495819091797, -4.936641693115234, -4.60178804397583, -4.266934394836426, -3.9320805072784424, -3.597226619720459, -3.2623727321624756, -2.927518844604492, -2.592665195465088, -2.2578113079071045, -1.922957420349121, -1.5881037712097168, -1.2532498836517334, -0.91839599609375, -0.5835421681404114, -0.24868834018707275, 0.0861654281616211, 0.4210193157196045, 0.7558732032775879, 1.0907268524169922, 1.4255807399749756, 1.760434627532959, 2.0952885150909424, 2.430142402648926, 2.76499605178833, 3.0998499393463135, 3.434703826904297, 3.769557476043701, 4.1044111251831055, 4.439265251159668, 4.774118900299072, 5.108973026275635, 5.443826675415039, 5.778680801391602, 6.113534450531006, 6.44838809967041, 6.783242225646973, 7.118095874786377, 7.452949523925781, 7.787803649902344, 8.122657775878906, 8.457510948181152, 8.792365074157715, 9.127218246459961, 9.462072372436523, 9.796926498413086]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 9.0, 12.0, 26.0, 31.0, 70.0, 92.0, 126.0, 237.0, 368.0, 652.0, 1033.0, 1917.0, 3705.0, 7325.0, 15285.0, 33969.0, 81245.0, 200261.0, 335451.0, 211246.0, 86404.0, 36460.0, 16081.0, 7810.0, 3880.0, 2034.0, 1120.0, 647.0, 412.0, 232.0, 145.0, 107.0, 57.0, 39.0, 22.0, 12.0, 18.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.93359375, -1.879180908203125, -1.82476806640625, -1.770355224609375, -1.7159423828125, -1.661529541015625, -1.60711669921875, -1.552703857421875, -1.498291015625, -1.443878173828125, -1.38946533203125, -1.335052490234375, -1.2806396484375, -1.226226806640625, -1.17181396484375, -1.117401123046875, -1.06298828125, -1.008575439453125, -0.95416259765625, -0.899749755859375, -0.8453369140625, -0.790924072265625, -0.73651123046875, -0.682098388671875, -0.627685546875, -0.573272705078125, -0.51885986328125, -0.464447021484375, -0.4100341796875, -0.355621337890625, -0.30120849609375, -0.246795654296875, -0.1923828125, -0.137969970703125, -0.08355712890625, -0.029144287109375, 0.0252685546875, 0.079681396484375, 0.13409423828125, 0.188507080078125, 0.242919921875, 0.297332763671875, 0.35174560546875, 0.406158447265625, 0.4605712890625, 0.514984130859375, 0.56939697265625, 0.623809814453125, 0.67822265625, 0.732635498046875, 0.78704833984375, 0.841461181640625, 0.8958740234375, 0.950286865234375, 1.00469970703125, 1.059112548828125, 1.113525390625, 1.167938232421875, 1.22235107421875, 1.276763916015625, 1.3311767578125, 1.385589599609375, 1.44000244140625, 1.494415283203125, 1.548828125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 9.0, 11.0, 11.0, 16.0, 21.0, 14.0, 29.0, 27.0, 37.0, 34.0, 40.0, 37.0, 39.0, 56.0, 52.0, 43.0, 43.0, 55.0, 39.0, 48.0, 36.0, 47.0, 34.0, 36.0, 27.0, 21.0, 25.0, 14.0, 15.0, 18.0, 12.0, 9.0, 4.0, 2.0, 6.0, 4.0, 7.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78955078125, -0.7596206665039062, -0.7296905517578125, -0.6997604370117188, -0.669830322265625, -0.6399002075195312, -0.6099700927734375, -0.5800399780273438, -0.55010986328125, -0.5201797485351562, -0.4902496337890625, -0.46031951904296875, -0.430389404296875, -0.40045928955078125, -0.3705291748046875, -0.34059906005859375, -0.3106689453125, -0.28073883056640625, -0.2508087158203125, -0.22087860107421875, -0.190948486328125, -0.16101837158203125, -0.1310882568359375, -0.10115814208984375, -0.07122802734375, -0.04129791259765625, -0.0113677978515625, 0.01856231689453125, 0.048492431640625, 0.07842254638671875, 0.1083526611328125, 0.13828277587890625, 0.168212890625, 0.19814300537109375, 0.2280731201171875, 0.25800323486328125, 0.287933349609375, 0.31786346435546875, 0.3477935791015625, 0.37772369384765625, 0.40765380859375, 0.43758392333984375, 0.4675140380859375, 0.49744415283203125, 0.527374267578125, 0.5573043823242188, 0.5872344970703125, 0.6171646118164062, 0.6470947265625, 0.6770248413085938, 0.7069549560546875, 0.7368850708007812, 0.766815185546875, 0.7967453002929688, 0.8266754150390625, 0.8566055297851562, 0.88653564453125, 0.9164657592773438, 0.9463958740234375, 0.9763259887695312, 1.006256103515625, 1.0361862182617188, 1.0661163330078125, 1.0960464477539062, 1.1259765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 8.0, 12.0, 26.0, 30.0, 40.0, 69.0, 129.0, 194.0, 318.0, 602.0, 1172.0, 3033.0, 10941.0, 62688.0, 549819.0, 360921.0, 45024.0, 8691.0, 2532.0, 1041.0, 510.0, 291.0, 159.0, 89.0, 74.0, 47.0, 28.0, 14.0, 14.0, 14.0, 4.0, 7.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.82421875, -4.70025634765625, -4.5762939453125, -4.45233154296875, -4.328369140625, -4.20440673828125, -4.0804443359375, -3.95648193359375, -3.83251953125, -3.70855712890625, -3.5845947265625, -3.46063232421875, -3.336669921875, -3.21270751953125, -3.0887451171875, -2.96478271484375, -2.8408203125, -2.71685791015625, -2.5928955078125, -2.46893310546875, -2.344970703125, -2.22100830078125, -2.0970458984375, -1.97308349609375, -1.84912109375, -1.72515869140625, -1.6011962890625, -1.47723388671875, -1.353271484375, -1.22930908203125, -1.1053466796875, -0.98138427734375, -0.857421875, -0.73345947265625, -0.6094970703125, -0.48553466796875, -0.361572265625, -0.23760986328125, -0.1136474609375, 0.01031494140625, 0.13427734375, 0.25823974609375, 0.3822021484375, 0.50616455078125, 0.630126953125, 0.75408935546875, 0.8780517578125, 1.00201416015625, 1.1259765625, 1.24993896484375, 1.3739013671875, 1.49786376953125, 1.621826171875, 1.74578857421875, 1.8697509765625, 1.99371337890625, 2.11767578125, 2.24163818359375, 2.3656005859375, 2.48956298828125, 2.613525390625, 2.73748779296875, 2.8614501953125, 2.98541259765625, 3.109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 3.0, 9.0, 10.0, 12.0, 15.0, 10.0, 16.0, 22.0, 22.0, 27.0, 33.0, 42.0, 36.0, 31.0, 34.0, 36.0, 44.0, 41.0, 41.0, 54.0, 44.0, 30.0, 56.0, 43.0, 38.0, 33.0, 26.0, 25.0, 26.0, 24.0, 14.0, 25.0, 17.0, 12.0, 6.0, 7.0, 6.0, 5.0, 3.0, 7.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.0234375, -3.9017333984375, -3.780029296875, -3.6583251953125, -3.53662109375, -3.4149169921875, -3.293212890625, -3.1715087890625, -3.0498046875, -2.9281005859375, -2.806396484375, -2.6846923828125, -2.56298828125, -2.4412841796875, -2.319580078125, -2.1978759765625, -2.076171875, -1.9544677734375, -1.832763671875, -1.7110595703125, -1.58935546875, -1.4676513671875, -1.345947265625, -1.2242431640625, -1.1025390625, -0.9808349609375, -0.859130859375, -0.7374267578125, -0.61572265625, -0.4940185546875, -0.372314453125, -0.2506103515625, -0.12890625, -0.0072021484375, 0.114501953125, 0.2362060546875, 0.35791015625, 0.4796142578125, 0.601318359375, 0.7230224609375, 0.8447265625, 0.9664306640625, 1.088134765625, 1.2098388671875, 1.33154296875, 1.4532470703125, 1.574951171875, 1.6966552734375, 1.818359375, 1.9400634765625, 2.061767578125, 2.1834716796875, 2.30517578125, 2.4268798828125, 2.548583984375, 2.6702880859375, 2.7919921875, 2.9136962890625, 3.035400390625, 3.1571044921875, 3.27880859375, 3.4005126953125, 3.522216796875, 3.6439208984375, 3.765625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 14.0, 13.0, 20.0, 27.0, 66.0, 97.0, 165.0, 478.0, 1479.0, 9175.0, 255257.0, 757519.0, 20756.0, 2326.0, 633.0, 236.0, 121.0, 60.0, 35.0, 13.0, 13.0, 9.0, 8.0, 3.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.625, -2.543365478515625, -2.46173095703125, -2.380096435546875, -2.2984619140625, -2.216827392578125, -2.13519287109375, -2.053558349609375, -1.971923828125, -1.890289306640625, -1.80865478515625, -1.727020263671875, -1.6453857421875, -1.563751220703125, -1.48211669921875, -1.400482177734375, -1.31884765625, -1.237213134765625, -1.15557861328125, -1.073944091796875, -0.9923095703125, -0.910675048828125, -0.82904052734375, -0.747406005859375, -0.665771484375, -0.584136962890625, -0.50250244140625, -0.420867919921875, -0.3392333984375, -0.257598876953125, -0.17596435546875, -0.094329833984375, -0.0126953125, 0.068939208984375, 0.15057373046875, 0.232208251953125, 0.3138427734375, 0.395477294921875, 0.47711181640625, 0.558746337890625, 0.640380859375, 0.722015380859375, 0.80364990234375, 0.885284423828125, 0.9669189453125, 1.048553466796875, 1.13018798828125, 1.211822509765625, 1.29345703125, 1.375091552734375, 1.45672607421875, 1.538360595703125, 1.6199951171875, 1.701629638671875, 1.78326416015625, 1.864898681640625, 1.946533203125, 2.028167724609375, 2.10980224609375, 2.191436767578125, 2.2730712890625, 2.354705810546875, 2.43634033203125, 2.517974853515625, 2.599609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 5.0, 9.0, 13.0, 9.0, 13.0, 21.0, 27.0, 27.0, 41.0, 49.0, 52.0, 64.0, 79.0, 94.0, 76.0, 77.0, 63.0, 49.0, 47.0, 31.0, 30.0, 18.0, 24.0, 17.0, 9.0, 11.0, 9.0, 11.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018310546875, -0.00017629563808441162, -0.00016948580741882324, -0.00016267597675323486, -0.00015586614608764648, -0.0001490563154220581, -0.00014224648475646973, -0.00013543665409088135, -0.00012862682342529297, -0.00012181699275970459, -0.00011500716209411621, -0.00010819733142852783, -0.00010138750076293945, -9.457767009735107e-05, -8.77678394317627e-05, -8.095800876617432e-05, -7.414817810058594e-05, -6.733834743499756e-05, -6.052851676940918e-05, -5.37186861038208e-05, -4.690885543823242e-05, -4.009902477264404e-05, -3.3289194107055664e-05, -2.6479363441467285e-05, -1.9669532775878906e-05, -1.2859702110290527e-05, -6.0498714447021484e-06, 7.599592208862305e-07, 7.569789886474609e-06, 1.4379620552062988e-05, 2.1189451217651367e-05, 2.7999281883239746e-05, 3.4809112548828125e-05, 4.1618943214416504e-05, 4.842877388000488e-05, 5.523860454559326e-05, 6.204843521118164e-05, 6.885826587677002e-05, 7.56680965423584e-05, 8.247792720794678e-05, 8.928775787353516e-05, 9.609758853912354e-05, 0.00010290741920471191, 0.00010971724987030029, 0.00011652708053588867, 0.00012333691120147705, 0.00013014674186706543, 0.0001369565725326538, 0.0001437664031982422, 0.00015057623386383057, 0.00015738606452941895, 0.00016419589519500732, 0.0001710057258605957, 0.00017781555652618408, 0.00018462538719177246, 0.00019143521785736084, 0.00019824504852294922, 0.0002050548791885376, 0.00021186470985412598, 0.00021867454051971436, 0.00022548437118530273, 0.0002322942018508911, 0.0002391040325164795, 0.00024591386318206787, 0.00025272369384765625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 1.0, 3.0, 3.0, 12.0, 17.0, 24.0, 39.0, 54.0, 96.0, 171.0, 371.0, 771.0, 2300.0, 9863.0, 104569.0, 798472.0, 116897.0, 10747.0, 2525.0, 829.0, 374.0, 164.0, 98.0, 69.0, 27.0, 20.0, 10.0, 9.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.380859375, -1.326751708984375, -1.27264404296875, -1.218536376953125, -1.1644287109375, -1.110321044921875, -1.05621337890625, -1.002105712890625, -0.947998046875, -0.893890380859375, -0.83978271484375, -0.785675048828125, -0.7315673828125, -0.677459716796875, -0.62335205078125, -0.569244384765625, -0.51513671875, -0.461029052734375, -0.40692138671875, -0.352813720703125, -0.2987060546875, -0.244598388671875, -0.19049072265625, -0.136383056640625, -0.082275390625, -0.028167724609375, 0.02593994140625, 0.080047607421875, 0.1341552734375, 0.188262939453125, 0.24237060546875, 0.296478271484375, 0.3505859375, 0.404693603515625, 0.45880126953125, 0.512908935546875, 0.5670166015625, 0.621124267578125, 0.67523193359375, 0.729339599609375, 0.783447265625, 0.837554931640625, 0.89166259765625, 0.945770263671875, 0.9998779296875, 1.053985595703125, 1.10809326171875, 1.162200927734375, 1.21630859375, 1.270416259765625, 1.32452392578125, 1.378631591796875, 1.4327392578125, 1.486846923828125, 1.54095458984375, 1.595062255859375, 1.649169921875, 1.703277587890625, 1.75738525390625, 1.811492919921875, 1.8656005859375, 1.919708251953125, 1.97381591796875, 2.027923583984375, 2.08203125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 10.0, 12.0, 12.0, 23.0, 35.0, 57.0, 65.0, 82.0, 124.0, 106.0, 126.0, 84.0, 77.0, 66.0, 31.0, 31.0, 19.0, 11.0, 10.0, 8.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.205169677734375, -1.15252685546875, -1.099884033203125, -1.0472412109375, -0.994598388671875, -0.94195556640625, -0.889312744140625, -0.836669921875, -0.784027099609375, -0.73138427734375, -0.678741455078125, -0.6260986328125, -0.573455810546875, -0.52081298828125, -0.468170166015625, -0.41552734375, -0.362884521484375, -0.31024169921875, -0.257598876953125, -0.2049560546875, -0.152313232421875, -0.09967041015625, -0.047027587890625, 0.005615234375, 0.058258056640625, 0.11090087890625, 0.163543701171875, 0.2161865234375, 0.268829345703125, 0.32147216796875, 0.374114990234375, 0.4267578125, 0.479400634765625, 0.53204345703125, 0.584686279296875, 0.6373291015625, 0.689971923828125, 0.74261474609375, 0.795257568359375, 0.847900390625, 0.900543212890625, 0.95318603515625, 1.005828857421875, 1.0584716796875, 1.111114501953125, 1.16375732421875, 1.216400146484375, 1.26904296875, 1.321685791015625, 1.37432861328125, 1.426971435546875, 1.4796142578125, 1.532257080078125, 1.58489990234375, 1.637542724609375, 1.690185546875, 1.742828369140625, 1.79547119140625, 1.848114013671875, 1.9007568359375, 1.953399658203125, 2.00604248046875, 2.058685302734375, 2.111328125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 4.0, 10.0, 19.0, 34.0, 90.0, 125.0, 181.0, 217.0, 139.0, 89.0, 42.0, 21.0, 15.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.67139434814453, -25.722217559814453, -24.773040771484375, -23.823863983154297, -22.87468719482422, -21.92551040649414, -20.976333618164062, -20.027156829833984, -19.077980041503906, -18.128803253173828, -17.17962646484375, -16.230449676513672, -15.281272888183594, -14.332096099853516, -13.382919311523438, -12.43374252319336, -11.484566688537598, -10.53538990020752, -9.586213111877441, -8.637036323547363, -7.687859535217285, -6.738683223724365, -5.789506435394287, -4.840329647064209, -3.891152858734131, -2.9419760704040527, -1.9927994012832642, -1.0436227321624756, -0.09444594383239746, 0.8547306060791016, 1.8039073944091797, 2.753084182739258, 3.702260971069336, 4.651437759399414, 5.600614547729492, 6.54979133605957, 7.498968124389648, 8.448144912719727, 9.397321701049805, 10.346498489379883, 11.295675277709961, 12.244852066040039, 13.194028854370117, 14.143205642700195, 15.092382431030273, 16.04155921936035, 16.99073600769043, 17.939912796020508, 18.889087677001953, 19.83826446533203, 20.78744125366211, 21.736618041992188, 22.685794830322266, 23.634971618652344, 24.584148406982422, 25.5333251953125, 26.482501983642578, 27.431678771972656, 28.380855560302734, 29.330032348632812, 30.27920913696289, 31.22838592529297, 32.17756271362305, 33.126739501953125, 34.0759162902832]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 13.0, 11.0, 11.0, 17.0, 23.0, 21.0, 23.0, 38.0, 35.0, 38.0, 41.0, 50.0, 52.0, 58.0, 70.0, 73.0, 47.0, 45.0, 36.0, 48.0, 36.0, 36.0, 30.0, 26.0, 17.0, 19.0, 16.0, 9.0, 10.0, 6.0, 2.0, 10.0, 2.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.40782356262207, -18.776329040527344, -18.144834518432617, -17.51333999633789, -16.881847381591797, -16.25035285949707, -15.618858337402344, -14.987363815307617, -14.35586929321289, -13.724374771118164, -13.092881202697754, -12.461386680603027, -11.8298921585083, -11.19839859008789, -10.566904067993164, -9.935409545898438, -9.303915977478027, -8.6724214553833, -8.04092788696289, -7.409433364868164, -6.7779388427734375, -6.146444797515869, -5.514950752258301, -4.883456230163574, -4.251962184906006, -3.6204679012298584, -2.988973617553711, -2.3574795722961426, -1.7259852886199951, -1.0944910049438477, -0.4629969596862793, 0.16849756240844727, 0.7999916076660156, 1.431485891342163, 2.0629801750183105, 2.694474220275879, 3.3259685039520264, 3.957462787628174, 4.588956832885742, 5.220451354980469, 5.851945400238037, 6.4834394454956055, 7.114933967590332, 7.7464280128479, 8.377922058105469, 9.009416580200195, 9.640911102294922, 10.272405624389648, 10.903899192810059, 11.535393714904785, 12.166887283325195, 12.798381805419922, 13.429876327514648, 14.061370849609375, 14.692864418029785, 15.324358940124512, 15.955852508544922, 16.58734703063965, 17.218841552734375, 17.85033416748047, 18.481828689575195, 19.113323211669922, 19.74481773376465, 20.376312255859375, 21.0078067779541]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 8.0, 14.0, 42.0, 70.0, 179.0, 353.0, 754.0, 1684.0, 4729.0, 16630.0, 82741.0, 897752.0, 2844768.0, 293385.0, 38509.0, 8663.0, 2440.0, 801.0, 337.0, 147.0, 84.0, 51.0, 29.0, 19.0, 23.0, 14.0, 7.0, 11.0, 6.0, 4.0, 6.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3583984375, -1.3024749755859375, -1.246551513671875, -1.1906280517578125, -1.13470458984375, -1.0787811279296875, -1.022857666015625, -0.9669342041015625, -0.9110107421875, -0.8550872802734375, -0.799163818359375, -0.7432403564453125, -0.68731689453125, -0.6313934326171875, -0.575469970703125, -0.5195465087890625, -0.463623046875, -0.4076995849609375, -0.351776123046875, -0.2958526611328125, -0.23992919921875, -0.1840057373046875, -0.128082275390625, -0.0721588134765625, -0.0162353515625, 0.0396881103515625, 0.095611572265625, 0.1515350341796875, 0.20745849609375, 0.2633819580078125, 0.319305419921875, 0.3752288818359375, 0.43115234375, 0.4870758056640625, 0.542999267578125, 0.5989227294921875, 0.65484619140625, 0.7107696533203125, 0.766693115234375, 0.8226165771484375, 0.8785400390625, 0.9344635009765625, 0.990386962890625, 1.0463104248046875, 1.10223388671875, 1.1581573486328125, 1.214080810546875, 1.2700042724609375, 1.325927734375, 1.3818511962890625, 1.437774658203125, 1.4936981201171875, 1.54962158203125, 1.6055450439453125, 1.661468505859375, 1.7173919677734375, 1.7733154296875, 1.8292388916015625, 1.885162353515625, 1.9410858154296875, 1.99700927734375, 2.0529327392578125, 2.108856201171875, 2.1647796630859375, 2.220703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 6.0, 14.0, 25.0, 39.0, 62.0, 90.0, 94.0, 107.0, 133.0, 118.0, 100.0, 74.0, 45.0, 48.0, 23.0, 19.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8720703125, -0.8027801513671875, -0.733489990234375, -0.6641998291015625, -0.59490966796875, -0.5256195068359375, -0.456329345703125, -0.3870391845703125, -0.3177490234375, -0.2484588623046875, -0.179168701171875, -0.1098785400390625, -0.04058837890625, 0.0287017822265625, 0.097991943359375, 0.1672821044921875, 0.236572265625, 0.3058624267578125, 0.375152587890625, 0.4444427490234375, 0.51373291015625, 0.5830230712890625, 0.652313232421875, 0.7216033935546875, 0.7908935546875, 0.8601837158203125, 0.929473876953125, 0.9987640380859375, 1.06805419921875, 1.1373443603515625, 1.206634521484375, 1.2759246826171875, 1.34521484375, 1.4145050048828125, 1.483795166015625, 1.5530853271484375, 1.62237548828125, 1.6916656494140625, 1.760955810546875, 1.8302459716796875, 1.8995361328125, 1.9688262939453125, 2.038116455078125, 2.1074066162109375, 2.17669677734375, 2.2459869384765625, 2.315277099609375, 2.3845672607421875, 2.453857421875, 2.5231475830078125, 2.592437744140625, 2.6617279052734375, 2.73101806640625, 2.8003082275390625, 2.869598388671875, 2.9388885498046875, 3.0081787109375, 3.0774688720703125, 3.146759033203125, 3.2160491943359375, 3.28533935546875, 3.3546295166015625, 3.423919677734375, 3.4932098388671875, 3.5625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 7.0, 12.0, 17.0, 19.0, 24.0, 27.0, 47.0, 74.0, 112.0, 177.0, 313.0, 546.0, 1276.0, 3117.0, 8342.0, 25436.0, 110009.0, 1156827.0, 2635151.0, 199534.0, 37137.0, 9859.0, 3422.0, 1343.0, 648.0, 315.0, 175.0, 103.0, 62.0, 53.0, 32.0, 18.0, 21.0, 9.0, 5.0, 7.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.462890625, -2.394775390625, -2.32666015625, -2.258544921875, -2.1904296875, -2.122314453125, -2.05419921875, -1.986083984375, -1.91796875, -1.849853515625, -1.78173828125, -1.713623046875, -1.6455078125, -1.577392578125, -1.50927734375, -1.441162109375, -1.373046875, -1.304931640625, -1.23681640625, -1.168701171875, -1.1005859375, -1.032470703125, -0.96435546875, -0.896240234375, -0.828125, -0.760009765625, -0.69189453125, -0.623779296875, -0.5556640625, -0.487548828125, -0.41943359375, -0.351318359375, -0.283203125, -0.215087890625, -0.14697265625, -0.078857421875, -0.0107421875, 0.057373046875, 0.12548828125, 0.193603515625, 0.26171875, 0.329833984375, 0.39794921875, 0.466064453125, 0.5341796875, 0.602294921875, 0.67041015625, 0.738525390625, 0.806640625, 0.874755859375, 0.94287109375, 1.010986328125, 1.0791015625, 1.147216796875, 1.21533203125, 1.283447265625, 1.3515625, 1.419677734375, 1.48779296875, 1.555908203125, 1.6240234375, 1.692138671875, 1.76025390625, 1.828369140625, 1.896484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 1.0, 8.0, 2.0, 3.0, 7.0, 6.0, 15.0, 9.0, 14.0, 16.0, 16.0, 18.0, 24.0, 41.0, 68.0, 83.0, 130.0, 183.0, 250.0, 352.0, 592.0, 613.0, 517.0, 340.0, 224.0, 148.0, 94.0, 80.0, 50.0, 45.0, 18.0, 29.0, 24.0, 13.0, 11.0, 6.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.052734375, -1.982696533203125, -1.91265869140625, -1.842620849609375, -1.7725830078125, -1.702545166015625, -1.63250732421875, -1.562469482421875, -1.492431640625, -1.422393798828125, -1.35235595703125, -1.282318115234375, -1.2122802734375, -1.142242431640625, -1.07220458984375, -1.002166748046875, -0.93212890625, -0.862091064453125, -0.79205322265625, -0.722015380859375, -0.6519775390625, -0.581939697265625, -0.51190185546875, -0.441864013671875, -0.371826171875, -0.301788330078125, -0.23175048828125, -0.161712646484375, -0.0916748046875, -0.021636962890625, 0.04840087890625, 0.118438720703125, 0.1884765625, 0.258514404296875, 0.32855224609375, 0.398590087890625, 0.4686279296875, 0.538665771484375, 0.60870361328125, 0.678741455078125, 0.748779296875, 0.818817138671875, 0.88885498046875, 0.958892822265625, 1.0289306640625, 1.098968505859375, 1.16900634765625, 1.239044189453125, 1.30908203125, 1.379119873046875, 1.44915771484375, 1.519195556640625, 1.5892333984375, 1.659271240234375, 1.72930908203125, 1.799346923828125, 1.869384765625, 1.939422607421875, 2.00946044921875, 2.079498291015625, 2.1495361328125, 2.219573974609375, 2.28961181640625, 2.359649658203125, 2.4296875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 19.0, 45.0, 117.0, 262.0, 327.0, 149.0, 45.0, 14.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.65392303466797, -38.202369689941406, -36.75081253051758, -35.29925537109375, -33.84770202636719, -32.396148681640625, -30.944591522216797, -29.4930362701416, -28.041481018066406, -26.58992576599121, -25.138370513916016, -23.68681526184082, -22.235260009765625, -20.78370475769043, -19.332149505615234, -17.88059425354004, -16.429039001464844, -14.977483749389648, -13.525928497314453, -12.074373245239258, -10.622817993164062, -9.171262741088867, -7.719707489013672, -6.268152236938477, -4.816596984863281, -3.365041732788086, -1.9134864807128906, -0.4619312286376953, 0.9896240234375, 2.4411792755126953, 3.8927345275878906, 5.344289779663086, 6.795848846435547, 8.247404098510742, 9.698959350585938, 11.150514602661133, 12.602069854736328, 14.053625106811523, 15.505180358886719, 16.956735610961914, 18.40829086303711, 19.859846115112305, 21.3114013671875, 22.762956619262695, 24.21451187133789, 25.666067123413086, 27.11762237548828, 28.569177627563477, 30.020732879638672, 31.472288131713867, 32.92384338378906, 34.375396728515625, 35.82695388793945, 37.27851104736328, 38.730064392089844, 40.181617736816406, 41.633174896240234, 43.08473205566406, 44.536285400390625, 45.98783874511719, 47.439395904541016, 48.890953063964844, 50.342506408691406, 51.79405975341797, 53.2456169128418]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 9.0, 19.0, 23.0, 17.0, 21.0, 28.0, 35.0, 41.0, 48.0, 49.0, 64.0, 85.0, 63.0, 78.0, 62.0, 51.0, 42.0, 61.0, 49.0, 37.0, 29.0, 18.0, 20.0, 9.0, 11.0, 7.0, 6.0, 2.0, 1.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-22.36190414428711, -21.82243537902832, -21.28296661376953, -20.743497848510742, -20.204029083251953, -19.664562225341797, -19.125093460083008, -18.58562469482422, -18.04615592956543, -17.50668716430664, -16.96721839904785, -16.427749633789062, -15.88828182220459, -15.3488130569458, -14.809345245361328, -14.269876480102539, -13.73040771484375, -13.190938949584961, -12.651470184326172, -12.1120023727417, -11.57253360748291, -11.033064842224121, -10.493597030639648, -9.95412826538086, -9.41465950012207, -8.875190734863281, -8.335721969604492, -7.7962541580200195, -7.2567853927612305, -6.717316627502441, -6.1778483390808105, -5.63838005065918, -5.098913192749023, -4.559444427490234, -4.0199761390686035, -3.4805076122283936, -2.9410390853881836, -2.4015705585479736, -1.8621020317077637, -1.3226335048675537, -0.7831649780273438, -0.2436964511871338, 0.29577207565307617, 0.8352406024932861, 1.374709129333496, 1.914177656173706, 2.453646183013916, 2.993114709854126, 3.532583236694336, 4.072052001953125, 4.611520290374756, 5.150988578796387, 5.690457344055176, 6.229926109313965, 6.769394397735596, 7.308862686157227, 7.848331451416016, 8.387800216674805, 8.927268981933594, 9.466736793518066, 10.006205558776855, 10.545674324035645, 11.085142135620117, 11.624610900878906, 12.164079666137695]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 11.0, 16.0, 41.0, 54.0, 75.0, 145.0, 228.0, 527.0, 952.0, 2204.0, 4849.0, 11866.0, 28482.0, 68983.0, 154509.0, 275902.0, 260023.0, 136617.0, 59816.0, 25008.0, 10130.0, 4415.0, 1885.0, 845.0, 416.0, 218.0, 141.0, 71.0, 46.0, 25.0, 20.0, 15.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1875, -1.1433868408203125, -1.099273681640625, -1.0551605224609375, -1.01104736328125, -0.9669342041015625, -0.922821044921875, -0.8787078857421875, -0.8345947265625, -0.7904815673828125, -0.746368408203125, -0.7022552490234375, -0.65814208984375, -0.6140289306640625, -0.569915771484375, -0.5258026123046875, -0.481689453125, -0.4375762939453125, -0.393463134765625, -0.3493499755859375, -0.30523681640625, -0.2611236572265625, -0.217010498046875, -0.1728973388671875, -0.1287841796875, -0.0846710205078125, -0.040557861328125, 0.0035552978515625, 0.04766845703125, 0.0917816162109375, 0.135894775390625, 0.1800079345703125, 0.22412109375, 0.2682342529296875, 0.312347412109375, 0.3564605712890625, 0.40057373046875, 0.4446868896484375, 0.488800048828125, 0.5329132080078125, 0.5770263671875, 0.6211395263671875, 0.665252685546875, 0.7093658447265625, 0.75347900390625, 0.7975921630859375, 0.841705322265625, 0.8858184814453125, 0.929931640625, 0.9740447998046875, 1.018157958984375, 1.0622711181640625, 1.10638427734375, 1.1504974365234375, 1.194610595703125, 1.2387237548828125, 1.2828369140625, 1.3269500732421875, 1.371063232421875, 1.4151763916015625, 1.45928955078125, 1.5034027099609375, 1.547515869140625, 1.5916290283203125, 1.6357421875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 3.0, 6.0, 6.0, 14.0, 19.0, 18.0, 30.0, 25.0, 38.0, 48.0, 49.0, 51.0, 47.0, 46.0, 63.0, 65.0, 54.0, 64.0, 53.0, 46.0, 41.0, 42.0, 27.0, 35.0, 22.0, 26.0, 18.0, 19.0, 6.0, 11.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79736328125, -0.7635116577148438, -0.7296600341796875, -0.6958084106445312, -0.661956787109375, -0.6281051635742188, -0.5942535400390625, -0.5604019165039062, -0.52655029296875, -0.49269866943359375, -0.4588470458984375, -0.42499542236328125, -0.391143798828125, -0.35729217529296875, -0.3234405517578125, -0.28958892822265625, -0.2557373046875, -0.22188568115234375, -0.1880340576171875, -0.15418243408203125, -0.120330810546875, -0.08647918701171875, -0.0526275634765625, -0.01877593994140625, 0.01507568359375, 0.04892730712890625, 0.0827789306640625, 0.11663055419921875, 0.150482177734375, 0.18433380126953125, 0.2181854248046875, 0.25203704833984375, 0.285888671875, 0.31974029541015625, 0.3535919189453125, 0.38744354248046875, 0.421295166015625, 0.45514678955078125, 0.4889984130859375, 0.5228500366210938, 0.55670166015625, 0.5905532836914062, 0.6244049072265625, 0.6582565307617188, 0.692108154296875, 0.7259597778320312, 0.7598114013671875, 0.7936630249023438, 0.8275146484375, 0.8613662719726562, 0.8952178955078125, 0.9290695190429688, 0.962921142578125, 0.9967727661132812, 1.0306243896484375, 1.0644760131835938, 1.09832763671875, 1.1321792602539062, 1.1660308837890625, 1.1998825073242188, 1.233734130859375, 1.2675857543945312, 1.3014373779296875, 1.3352890014648438, 1.369140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 5.0, 7.0, 8.0, 13.0, 28.0, 20.0, 27.0, 35.0, 58.0, 81.0, 94.0, 164.0, 208.0, 335.0, 451.0, 683.0, 1162.0, 2367.0, 6113.0, 25368.0, 172627.0, 667545.0, 138960.0, 21407.0, 5479.0, 2197.0, 1092.0, 646.0, 393.0, 277.0, 197.0, 121.0, 106.0, 69.0, 42.0, 49.0, 26.0, 30.0, 15.0, 11.0, 8.0, 11.0, 10.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.650390625, -2.557220458984375, -2.46405029296875, -2.370880126953125, -2.2777099609375, -2.184539794921875, -2.09136962890625, -1.998199462890625, -1.905029296875, -1.811859130859375, -1.71868896484375, -1.625518798828125, -1.5323486328125, -1.439178466796875, -1.34600830078125, -1.252838134765625, -1.15966796875, -1.066497802734375, -0.97332763671875, -0.880157470703125, -0.7869873046875, -0.693817138671875, -0.60064697265625, -0.507476806640625, -0.414306640625, -0.321136474609375, -0.22796630859375, -0.134796142578125, -0.0416259765625, 0.051544189453125, 0.14471435546875, 0.237884521484375, 0.3310546875, 0.424224853515625, 0.51739501953125, 0.610565185546875, 0.7037353515625, 0.796905517578125, 0.89007568359375, 0.983245849609375, 1.076416015625, 1.169586181640625, 1.26275634765625, 1.355926513671875, 1.4490966796875, 1.542266845703125, 1.63543701171875, 1.728607177734375, 1.82177734375, 1.914947509765625, 2.00811767578125, 2.101287841796875, 2.1944580078125, 2.287628173828125, 2.38079833984375, 2.473968505859375, 2.567138671875, 2.660308837890625, 2.75347900390625, 2.846649169921875, 2.9398193359375, 3.032989501953125, 3.12615966796875, 3.219329833984375, 3.3125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 7.0, 14.0, 13.0, 16.0, 25.0, 19.0, 39.0, 31.0, 36.0, 49.0, 34.0, 50.0, 56.0, 53.0, 40.0, 59.0, 48.0, 56.0, 34.0, 47.0, 47.0, 27.0, 18.0, 34.0, 22.0, 30.0, 17.0, 13.0, 12.0, 15.0, 7.0, 7.0, 4.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96484375, -3.833251953125, -3.70166015625, -3.570068359375, -3.4384765625, -3.306884765625, -3.17529296875, -3.043701171875, -2.912109375, -2.780517578125, -2.64892578125, -2.517333984375, -2.3857421875, -2.254150390625, -2.12255859375, -1.990966796875, -1.859375, -1.727783203125, -1.59619140625, -1.464599609375, -1.3330078125, -1.201416015625, -1.06982421875, -0.938232421875, -0.806640625, -0.675048828125, -0.54345703125, -0.411865234375, -0.2802734375, -0.148681640625, -0.01708984375, 0.114501953125, 0.24609375, 0.377685546875, 0.50927734375, 0.640869140625, 0.7724609375, 0.904052734375, 1.03564453125, 1.167236328125, 1.298828125, 1.430419921875, 1.56201171875, 1.693603515625, 1.8251953125, 1.956787109375, 2.08837890625, 2.219970703125, 2.3515625, 2.483154296875, 2.61474609375, 2.746337890625, 2.8779296875, 3.009521484375, 3.14111328125, 3.272705078125, 3.404296875, 3.535888671875, 3.66748046875, 3.799072265625, 3.9306640625, 4.062255859375, 4.19384765625, 4.325439453125, 4.45703125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 4.0, 9.0, 19.0, 19.0, 55.0, 106.0, 355.0, 1277.0, 7377.0, 182769.0, 830307.0, 22913.0, 2486.0, 509.0, 182.0, 82.0, 37.0, 19.0, 9.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7177734375, -1.6546478271484375, -1.591522216796875, -1.5283966064453125, -1.46527099609375, -1.4021453857421875, -1.339019775390625, -1.2758941650390625, -1.2127685546875, -1.1496429443359375, -1.086517333984375, -1.0233917236328125, -0.96026611328125, -0.8971405029296875, -0.834014892578125, -0.7708892822265625, -0.707763671875, -0.6446380615234375, -0.581512451171875, -0.5183868408203125, -0.45526123046875, -0.3921356201171875, -0.329010009765625, -0.2658843994140625, -0.2027587890625, -0.1396331787109375, -0.076507568359375, -0.0133819580078125, 0.04974365234375, 0.1128692626953125, 0.175994873046875, 0.2391204833984375, 0.30224609375, 0.3653717041015625, 0.428497314453125, 0.4916229248046875, 0.55474853515625, 0.6178741455078125, 0.680999755859375, 0.7441253662109375, 0.8072509765625, 0.8703765869140625, 0.933502197265625, 0.9966278076171875, 1.05975341796875, 1.1228790283203125, 1.186004638671875, 1.2491302490234375, 1.312255859375, 1.3753814697265625, 1.438507080078125, 1.5016326904296875, 1.56475830078125, 1.6278839111328125, 1.691009521484375, 1.7541351318359375, 1.8172607421875, 1.8803863525390625, 1.943511962890625, 2.0066375732421875, 2.06976318359375, 2.1328887939453125, 2.196014404296875, 2.2591400146484375, 2.322265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 8.0, 10.0, 10.0, 8.0, 14.0, 23.0, 22.0, 37.0, 36.0, 33.0, 57.0, 63.0, 75.0, 114.0, 90.0, 71.0, 53.0, 56.0, 37.0, 28.0, 33.0, 22.0, 27.0, 17.0, 14.0, 13.0, 7.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00020265579223632812, -0.0001956634223461151, -0.0001886710524559021, -0.0001816786825656891, -0.00017468631267547607, -0.00016769394278526306, -0.00016070157289505005, -0.00015370920300483704, -0.00014671683311462402, -0.000139724463224411, -0.000132732093334198, -0.00012573972344398499, -0.00011874735355377197, -0.00011175498366355896, -0.00010476261377334595, -9.777024388313293e-05, -9.077787399291992e-05, -8.378550410270691e-05, -7.67931342124939e-05, -6.980076432228088e-05, -6.280839443206787e-05, -5.581602454185486e-05, -4.8823654651641846e-05, -4.183128476142883e-05, -3.483891487121582e-05, -2.7846544981002808e-05, -2.0854175090789795e-05, -1.3861805200576782e-05, -6.8694353103637695e-06, 1.2293457984924316e-07, 7.115304470062256e-06, 1.4107674360275269e-05, 2.110004425048828e-05, 2.8092414140701294e-05, 3.508478403091431e-05, 4.207715392112732e-05, 4.906952381134033e-05, 5.6061893701553345e-05, 6.305426359176636e-05, 7.004663348197937e-05, 7.703900337219238e-05, 8.40313732624054e-05, 9.102374315261841e-05, 9.801611304283142e-05, 0.00010500848293304443, 0.00011200085282325745, 0.00011899322271347046, 0.00012598559260368347, 0.00013297796249389648, 0.0001399703323841095, 0.0001469627022743225, 0.00015395507216453552, 0.00016094744205474854, 0.00016793981194496155, 0.00017493218183517456, 0.00018192455172538757, 0.00018891692161560059, 0.0001959092915058136, 0.0002029016613960266, 0.00020989403128623962, 0.00021688640117645264, 0.00022387877106666565, 0.00023087114095687866, 0.00023786351084709167, 0.0002448558807373047]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 7.0, 11.0, 18.0, 27.0, 31.0, 55.0, 73.0, 165.0, 299.0, 582.0, 1403.0, 3548.0, 13446.0, 98406.0, 751780.0, 152901.0, 18415.0, 4359.0, 1579.0, 660.0, 311.0, 173.0, 118.0, 67.0, 46.0, 24.0, 11.0, 13.0, 7.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.931640625, -0.8978729248046875, -0.864105224609375, -0.8303375244140625, -0.79656982421875, -0.7628021240234375, -0.729034423828125, -0.6952667236328125, -0.6614990234375, -0.6277313232421875, -0.593963623046875, -0.5601959228515625, -0.52642822265625, -0.4926605224609375, -0.458892822265625, -0.4251251220703125, -0.391357421875, -0.3575897216796875, -0.323822021484375, -0.2900543212890625, -0.25628662109375, -0.2225189208984375, -0.188751220703125, -0.1549835205078125, -0.1212158203125, -0.0874481201171875, -0.053680419921875, -0.0199127197265625, 0.01385498046875, 0.0476226806640625, 0.081390380859375, 0.1151580810546875, 0.14892578125, 0.1826934814453125, 0.216461181640625, 0.2502288818359375, 0.28399658203125, 0.3177642822265625, 0.351531982421875, 0.3852996826171875, 0.4190673828125, 0.4528350830078125, 0.486602783203125, 0.5203704833984375, 0.55413818359375, 0.5879058837890625, 0.621673583984375, 0.6554412841796875, 0.689208984375, 0.7229766845703125, 0.756744384765625, 0.7905120849609375, 0.82427978515625, 0.8580474853515625, 0.891815185546875, 0.9255828857421875, 0.9593505859375, 0.9931182861328125, 1.026885986328125, 1.0606536865234375, 1.09442138671875, 1.1281890869140625, 1.161956787109375, 1.1957244873046875, 1.2294921875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 9.0, 7.0, 7.0, 14.0, 18.0, 24.0, 20.0, 33.0, 40.0, 52.0, 72.0, 66.0, 72.0, 83.0, 69.0, 67.0, 66.0, 56.0, 46.0, 44.0, 33.0, 27.0, 19.0, 9.0, 11.0, 11.0, 7.0, 7.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69580078125, -0.6655807495117188, -0.6353607177734375, -0.6051406860351562, -0.574920654296875, -0.5447006225585938, -0.5144805908203125, -0.48426055908203125, -0.45404052734375, -0.42382049560546875, -0.3936004638671875, -0.36338043212890625, -0.333160400390625, -0.30294036865234375, -0.2727203369140625, -0.24250030517578125, -0.2122802734375, -0.18206024169921875, -0.1518402099609375, -0.12162017822265625, -0.091400146484375, -0.06118011474609375, -0.0309600830078125, -0.00074005126953125, 0.02947998046875, 0.05970001220703125, 0.0899200439453125, 0.12014007568359375, 0.150360107421875, 0.18058013916015625, 0.2108001708984375, 0.24102020263671875, 0.271240234375, 0.30146026611328125, 0.3316802978515625, 0.36190032958984375, 0.392120361328125, 0.42234039306640625, 0.4525604248046875, 0.48278045654296875, 0.51300048828125, 0.5432205200195312, 0.5734405517578125, 0.6036605834960938, 0.633880615234375, 0.6641006469726562, 0.6943206787109375, 0.7245407104492188, 0.7547607421875, 0.7849807739257812, 0.8152008056640625, 0.8454208374023438, 0.875640869140625, 0.9058609008789062, 0.9360809326171875, 0.9663009643554688, 0.99652099609375, 1.0267410278320312, 1.0569610595703125, 1.0871810913085938, 1.117401123046875, 1.1476211547851562, 1.1778411865234375, 1.2080612182617188, 1.23828125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 3.0, 1.0, 1.0, 2.0, 8.0, 17.0, 26.0, 60.0, 113.0, 199.0, 259.0, 166.0, 87.0, 26.0, 20.0, 10.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.236351013183594, -24.37698745727539, -23.51762580871582, -22.658262252807617, -21.798900604248047, -20.939537048339844, -20.080175399780273, -19.22081184387207, -18.3614501953125, -17.502086639404297, -16.642724990844727, -15.78336238861084, -14.923999786376953, -14.06463623046875, -13.20527458190918, -12.345911026000977, -11.48654842376709, -10.627185821533203, -9.767823219299316, -8.90846061706543, -8.049098014831543, -7.189734935760498, -6.330372333526611, -5.471009731292725, -4.611647129058838, -3.752284526824951, -2.8929219245910645, -2.0335590839385986, -1.174196481704712, -0.3148336410522461, 0.5445289611816406, 1.4038915634155273, 2.263254165649414, 3.122616767883301, 3.9819793701171875, 4.841341972351074, 5.700704574584961, 6.560067653656006, 7.419430255889893, 8.278793334960938, 9.138154983520508, 9.997517585754395, 10.856880187988281, 11.716242790222168, 12.575605392456055, 13.434968948364258, 14.294330596923828, 15.153694152832031, 16.013057708740234, 16.872421264648438, 17.731782913208008, 18.59114646911621, 19.45050811767578, 20.309871673583984, 21.169233322143555, 22.028596878051758, 22.887958526611328, 23.74732208251953, 24.6066837310791, 25.466047286987305, 26.325408935546875, 27.184772491455078, 28.04413414001465, 28.90349769592285, 29.762859344482422]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 8.0, 6.0, 4.0, 7.0, 13.0, 18.0, 12.0, 17.0, 16.0, 36.0, 32.0, 31.0, 32.0, 42.0, 32.0, 46.0, 48.0, 70.0, 78.0, 66.0, 58.0, 53.0, 39.0, 30.0, 32.0, 28.0, 29.0, 17.0, 20.0, 14.0, 16.0, 10.0, 15.0, 8.0, 7.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-15.957334518432617, -15.446669578552246, -14.936004638671875, -14.425338745117188, -13.914673805236816, -13.404008865356445, -12.893342971801758, -12.382678031921387, -11.872013092041016, -11.361348152160645, -10.850683212280273, -10.340017318725586, -9.829352378845215, -9.318687438964844, -8.808021545410156, -8.297356605529785, -7.786691665649414, -7.276026725769043, -6.765361309051514, -6.254695892333984, -5.744030952453613, -5.233366012573242, -4.722700595855713, -4.212035179138184, -3.7013702392578125, -3.1907050609588623, -2.680039882659912, -2.169374704360962, -1.6587095260620117, -1.1480443477630615, -0.6373791694641113, -0.12671399116516113, 0.38395118713378906, 0.8946163654327393, 1.4052815437316895, 1.9159467220306396, 2.42661190032959, 2.93727707862854, 3.4479422569274902, 3.9586074352264404, 4.469272613525391, 4.979937553405762, 5.490602970123291, 6.00126838684082, 6.511933326721191, 7.0225982666015625, 7.533263683319092, 8.043929100036621, 8.554594039916992, 9.065258979797363, 9.575923919677734, 10.086589813232422, 10.597254753112793, 11.107919692993164, 11.618585586547852, 12.129250526428223, 12.639915466308594, 13.150580406188965, 13.661245346069336, 14.171911239624023, 14.682576179504395, 15.193241119384766, 15.703907012939453, 16.214570999145508, 16.725236892700195]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 5.0, 13.0, 25.0, 25.0, 62.0, 152.0, 350.0, 745.0, 1970.0, 5085.0, 14559.0, 49093.0, 230453.0, 1381118.0, 2020275.0, 387480.0, 71666.0, 19997.0, 6809.0, 2533.0, 1030.0, 421.0, 171.0, 104.0, 45.0, 33.0, 14.0, 15.0, 7.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.02734375, -0.992095947265625, -0.95684814453125, -0.921600341796875, -0.8863525390625, -0.851104736328125, -0.81585693359375, -0.780609130859375, -0.745361328125, -0.710113525390625, -0.67486572265625, -0.639617919921875, -0.6043701171875, -0.569122314453125, -0.53387451171875, -0.498626708984375, -0.46337890625, -0.428131103515625, -0.39288330078125, -0.357635498046875, -0.3223876953125, -0.287139892578125, -0.25189208984375, -0.216644287109375, -0.181396484375, -0.146148681640625, -0.11090087890625, -0.075653076171875, -0.0404052734375, -0.005157470703125, 0.03009033203125, 0.065338134765625, 0.1005859375, 0.135833740234375, 0.17108154296875, 0.206329345703125, 0.2415771484375, 0.276824951171875, 0.31207275390625, 0.347320556640625, 0.382568359375, 0.417816162109375, 0.45306396484375, 0.488311767578125, 0.5235595703125, 0.558807373046875, 0.59405517578125, 0.629302978515625, 0.66455078125, 0.699798583984375, 0.73504638671875, 0.770294189453125, 0.8055419921875, 0.840789794921875, 0.87603759765625, 0.911285400390625, 0.946533203125, 0.981781005859375, 1.01702880859375, 1.052276611328125, 1.0875244140625, 1.122772216796875, 1.15802001953125, 1.193267822265625, 1.228515625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 7.0, 3.0, 11.0, 6.0, 20.0, 21.0, 21.0, 20.0, 32.0, 29.0, 27.0, 47.0, 44.0, 40.0, 42.0, 43.0, 43.0, 56.0, 51.0, 47.0, 45.0, 46.0, 34.0, 33.0, 35.0, 37.0, 19.0, 20.0, 20.0, 16.0, 14.0, 14.0, 8.0, 9.0, 11.0, 8.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8759765625, -0.8498077392578125, -0.823638916015625, -0.7974700927734375, -0.77130126953125, -0.7451324462890625, -0.718963623046875, -0.6927947998046875, -0.6666259765625, -0.6404571533203125, -0.614288330078125, -0.5881195068359375, -0.56195068359375, -0.5357818603515625, -0.509613037109375, -0.4834442138671875, -0.457275390625, -0.4311065673828125, -0.404937744140625, -0.3787689208984375, -0.35260009765625, -0.3264312744140625, -0.300262451171875, -0.2740936279296875, -0.2479248046875, -0.2217559814453125, -0.195587158203125, -0.1694183349609375, -0.14324951171875, -0.1170806884765625, -0.090911865234375, -0.0647430419921875, -0.03857421875, -0.0124053955078125, 0.013763427734375, 0.0399322509765625, 0.06610107421875, 0.0922698974609375, 0.118438720703125, 0.1446075439453125, 0.1707763671875, 0.1969451904296875, 0.223114013671875, 0.2492828369140625, 0.27545166015625, 0.3016204833984375, 0.327789306640625, 0.3539581298828125, 0.380126953125, 0.4062957763671875, 0.432464599609375, 0.4586334228515625, 0.48480224609375, 0.5109710693359375, 0.537139892578125, 0.5633087158203125, 0.5894775390625, 0.6156463623046875, 0.641815185546875, 0.6679840087890625, 0.69415283203125, 0.7203216552734375, 0.746490478515625, 0.7726593017578125, 0.798828125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 6.0, 5.0, 17.0, 12.0, 12.0, 16.0, 32.0, 49.0, 68.0, 152.0, 244.0, 565.0, 1138.0, 3250.0, 9895.0, 39838.0, 241321.0, 2922117.0, 864971.0, 84459.0, 18006.0, 4971.0, 1627.0, 683.0, 346.0, 189.0, 102.0, 56.0, 39.0, 36.0, 21.0, 15.0, 10.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.24609375, -2.1865692138671875, -2.127044677734375, -2.0675201416015625, -2.00799560546875, -1.9484710693359375, -1.888946533203125, -1.8294219970703125, -1.7698974609375, -1.7103729248046875, -1.650848388671875, -1.5913238525390625, -1.53179931640625, -1.4722747802734375, -1.412750244140625, -1.3532257080078125, -1.293701171875, -1.2341766357421875, -1.174652099609375, -1.1151275634765625, -1.05560302734375, -0.9960784912109375, -0.936553955078125, -0.8770294189453125, -0.8175048828125, -0.7579803466796875, -0.698455810546875, -0.6389312744140625, -0.57940673828125, -0.5198822021484375, -0.460357666015625, -0.4008331298828125, -0.34130859375, -0.2817840576171875, -0.222259521484375, -0.1627349853515625, -0.10321044921875, -0.0436859130859375, 0.015838623046875, 0.0753631591796875, 0.1348876953125, 0.1944122314453125, 0.253936767578125, 0.3134613037109375, 0.37298583984375, 0.4325103759765625, 0.492034912109375, 0.5515594482421875, 0.611083984375, 0.6706085205078125, 0.730133056640625, 0.7896575927734375, 0.84918212890625, 0.9087066650390625, 0.968231201171875, 1.0277557373046875, 1.0872802734375, 1.1468048095703125, 1.206329345703125, 1.2658538818359375, 1.32537841796875, 1.3849029541015625, 1.444427490234375, 1.5039520263671875, 1.5634765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 7.0, 4.0, 8.0, 12.0, 11.0, 8.0, 17.0, 27.0, 43.0, 50.0, 61.0, 87.0, 104.0, 152.0, 223.0, 335.0, 442.0, 563.0, 554.0, 398.0, 279.0, 184.0, 127.0, 92.0, 58.0, 51.0, 39.0, 25.0, 31.0, 21.0, 11.0, 15.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6572265625, -1.601287841796875, -1.54534912109375, -1.489410400390625, -1.4334716796875, -1.377532958984375, -1.32159423828125, -1.265655517578125, -1.209716796875, -1.153778076171875, -1.09783935546875, -1.041900634765625, -0.9859619140625, -0.930023193359375, -0.87408447265625, -0.818145751953125, -0.76220703125, -0.706268310546875, -0.65032958984375, -0.594390869140625, -0.5384521484375, -0.482513427734375, -0.42657470703125, -0.370635986328125, -0.314697265625, -0.258758544921875, -0.20281982421875, -0.146881103515625, -0.0909423828125, -0.035003662109375, 0.02093505859375, 0.076873779296875, 0.1328125, 0.188751220703125, 0.24468994140625, 0.300628662109375, 0.3565673828125, 0.412506103515625, 0.46844482421875, 0.524383544921875, 0.580322265625, 0.636260986328125, 0.69219970703125, 0.748138427734375, 0.8040771484375, 0.860015869140625, 0.91595458984375, 0.971893310546875, 1.02783203125, 1.083770751953125, 1.13970947265625, 1.195648193359375, 1.2515869140625, 1.307525634765625, 1.36346435546875, 1.419403076171875, 1.475341796875, 1.531280517578125, 1.58721923828125, 1.643157958984375, 1.6990966796875, 1.755035400390625, 1.81097412109375, 1.866912841796875, 1.9228515625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 17.0, 59.0, 265.0, 383.0, 176.0, 50.0, 21.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.37917709350586, -37.024932861328125, -35.670684814453125, -34.31644058227539, -32.962196350097656, -31.607952117919922, -30.253705978393555, -28.899459838867188, -27.545215606689453, -26.19097137451172, -24.83672523498535, -23.482479095458984, -22.12823486328125, -20.773990631103516, -19.41974449157715, -18.06549835205078, -16.711254119873047, -15.357008934020996, -14.002763748168945, -12.648518562316895, -11.294273376464844, -9.940028190612793, -8.585783004760742, -7.231537818908691, -5.877292633056641, -4.52304744720459, -3.168802261352539, -1.8145570755004883, -0.4603118896484375, 0.8939332962036133, 2.248178482055664, 3.602423667907715, 4.956672668457031, 6.310917854309082, 7.665163040161133, 9.019408226013184, 10.373653411865234, 11.727898597717285, 13.082143783569336, 14.436388969421387, 15.790634155273438, 17.144878387451172, 18.49912452697754, 19.853370666503906, 21.20761489868164, 22.561859130859375, 23.916105270385742, 25.27035140991211, 26.624595642089844, 27.978839874267578, 29.333086013793945, 30.687332153320312, 32.04157638549805, 33.39582061767578, 34.75006866455078, 36.104312896728516, 37.45855712890625, 38.812801361083984, 40.16704559326172, 41.52129364013672, 42.87553787231445, 44.22978210449219, 45.58403015136719, 46.93827438354492, 48.292518615722656]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 2.0, 6.0, 9.0, 8.0, 12.0, 10.0, 20.0, 23.0, 24.0, 33.0, 35.0, 47.0, 52.0, 52.0, 70.0, 68.0, 50.0, 49.0, 57.0, 57.0, 35.0, 57.0, 39.0, 31.0, 33.0, 29.0, 19.0, 11.0, 21.0, 12.0, 7.0, 7.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.817249298095703, -14.404088973999023, -13.99092960357666, -13.577770233154297, -13.164609909057617, -12.751449584960938, -12.338290214538574, -11.925130844116211, -11.511970520019531, -11.098810195922852, -10.685650825500488, -10.272491455078125, -9.859331130981445, -9.446170806884766, -9.033011436462402, -8.619852066040039, -8.20669174194336, -7.793531894683838, -7.380372047424316, -6.967212200164795, -6.554052352905273, -6.140892505645752, -5.7277326583862305, -5.314572811126709, -4.9014129638671875, -4.488253116607666, -4.0750932693481445, -3.661933422088623, -3.2487735748291016, -2.83561372756958, -2.4224538803100586, -2.009294033050537, -1.5961341857910156, -1.1829743385314941, -0.7698144912719727, -0.35665464401245117, 0.05650520324707031, 0.4696650505065918, 0.8828248977661133, 1.2959847450256348, 1.7091445922851562, 2.1223044395446777, 2.535464286804199, 2.9486241340637207, 3.361783981323242, 3.7749438285827637, 4.188103675842285, 4.601263523101807, 5.014423370361328, 5.42758321762085, 5.840743064880371, 6.253902912139893, 6.667062759399414, 7.0802226066589355, 7.493382453918457, 7.9065423011779785, 8.3197021484375, 8.73286247253418, 9.146021842956543, 9.559181213378906, 9.972341537475586, 10.385501861572266, 10.798661231994629, 11.211820602416992, 11.624980926513672]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 15.0, 17.0, 28.0, 59.0, 122.0, 238.0, 387.0, 799.0, 1661.0, 3638.0, 8420.0, 20853.0, 52765.0, 135162.0, 300774.0, 300020.0, 134951.0, 52991.0, 20317.0, 8358.0, 3590.0, 1677.0, 847.0, 391.0, 205.0, 105.0, 70.0, 34.0, 18.0, 14.0, 12.0, 4.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.630859375, -1.5782470703125, -1.525634765625, -1.4730224609375, -1.42041015625, -1.3677978515625, -1.315185546875, -1.2625732421875, -1.2099609375, -1.1573486328125, -1.104736328125, -1.0521240234375, -0.99951171875, -0.9468994140625, -0.894287109375, -0.8416748046875, -0.7890625, -0.7364501953125, -0.683837890625, -0.6312255859375, -0.57861328125, -0.5260009765625, -0.473388671875, -0.4207763671875, -0.3681640625, -0.3155517578125, -0.262939453125, -0.2103271484375, -0.15771484375, -0.1051025390625, -0.052490234375, 0.0001220703125, 0.052734375, 0.1053466796875, 0.157958984375, 0.2105712890625, 0.26318359375, 0.3157958984375, 0.368408203125, 0.4210205078125, 0.4736328125, 0.5262451171875, 0.578857421875, 0.6314697265625, 0.68408203125, 0.7366943359375, 0.789306640625, 0.8419189453125, 0.89453125, 0.9471435546875, 0.999755859375, 1.0523681640625, 1.10498046875, 1.1575927734375, 1.210205078125, 1.2628173828125, 1.3154296875, 1.3680419921875, 1.420654296875, 1.4732666015625, 1.52587890625, 1.5784912109375, 1.631103515625, 1.6837158203125, 1.736328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 7.0, 10.0, 5.0, 12.0, 17.0, 17.0, 26.0, 19.0, 33.0, 29.0, 17.0, 30.0, 37.0, 45.0, 42.0, 52.0, 53.0, 40.0, 52.0, 52.0, 51.0, 48.0, 38.0, 48.0, 30.0, 33.0, 17.0, 17.0, 22.0, 18.0, 18.0, 8.0, 9.0, 10.0, 8.0, 7.0, 4.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8505859375, -0.8228836059570312, -0.7951812744140625, -0.7674789428710938, -0.739776611328125, -0.7120742797851562, -0.6843719482421875, -0.6566696166992188, -0.62896728515625, -0.6012649536132812, -0.5735626220703125, -0.5458602905273438, -0.518157958984375, -0.49045562744140625, -0.4627532958984375, -0.43505096435546875, -0.4073486328125, -0.37964630126953125, -0.3519439697265625, -0.32424163818359375, -0.296539306640625, -0.26883697509765625, -0.2411346435546875, -0.21343231201171875, -0.18572998046875, -0.15802764892578125, -0.1303253173828125, -0.10262298583984375, -0.074920654296875, -0.04721832275390625, -0.0195159912109375, 0.00818634033203125, 0.035888671875, 0.06359100341796875, 0.0912933349609375, 0.11899566650390625, 0.146697998046875, 0.17440032958984375, 0.2021026611328125, 0.22980499267578125, 0.25750732421875, 0.28520965576171875, 0.3129119873046875, 0.34061431884765625, 0.368316650390625, 0.39601898193359375, 0.4237213134765625, 0.45142364501953125, 0.4791259765625, 0.5068283081054688, 0.5345306396484375, 0.5622329711914062, 0.589935302734375, 0.6176376342773438, 0.6453399658203125, 0.6730422973632812, 0.70074462890625, 0.7284469604492188, 0.7561492919921875, 0.7838516235351562, 0.811553955078125, 0.8392562866210938, 0.8669586181640625, 0.8946609497070312, 0.92236328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 3.0, 7.0, 8.0, 14.0, 24.0, 23.0, 31.0, 46.0, 72.0, 85.0, 133.0, 199.0, 280.0, 465.0, 778.0, 1562.0, 3737.0, 13000.0, 79689.0, 666690.0, 239086.0, 30933.0, 6546.0, 2344.0, 1129.0, 588.0, 333.0, 223.0, 148.0, 102.0, 78.0, 58.0, 32.0, 26.0, 25.0, 19.0, 7.0, 7.0, 4.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.46875, -3.36285400390625, -3.2569580078125, -3.15106201171875, -3.045166015625, -2.93927001953125, -2.8333740234375, -2.72747802734375, -2.62158203125, -2.51568603515625, -2.4097900390625, -2.30389404296875, -2.197998046875, -2.09210205078125, -1.9862060546875, -1.88031005859375, -1.7744140625, -1.66851806640625, -1.5626220703125, -1.45672607421875, -1.350830078125, -1.24493408203125, -1.1390380859375, -1.03314208984375, -0.92724609375, -0.82135009765625, -0.7154541015625, -0.60955810546875, -0.503662109375, -0.39776611328125, -0.2918701171875, -0.18597412109375, -0.080078125, 0.02581787109375, 0.1317138671875, 0.23760986328125, 0.343505859375, 0.44940185546875, 0.5552978515625, 0.66119384765625, 0.76708984375, 0.87298583984375, 0.9788818359375, 1.08477783203125, 1.190673828125, 1.29656982421875, 1.4024658203125, 1.50836181640625, 1.6142578125, 1.72015380859375, 1.8260498046875, 1.93194580078125, 2.037841796875, 2.14373779296875, 2.2496337890625, 2.35552978515625, 2.46142578125, 2.56732177734375, 2.6732177734375, 2.77911376953125, 2.885009765625, 2.99090576171875, 3.0968017578125, 3.20269775390625, 3.30859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 1.0, 10.0, 14.0, 16.0, 17.0, 24.0, 27.0, 35.0, 46.0, 58.0, 65.0, 66.0, 44.0, 55.0, 62.0, 61.0, 62.0, 42.0, 56.0, 46.0, 40.0, 25.0, 24.0, 25.0, 14.0, 9.0, 12.0, 11.0, 1.0, 5.0, 5.0, 7.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.56640625, -4.43243408203125, -4.2984619140625, -4.16448974609375, -4.030517578125, -3.89654541015625, -3.7625732421875, -3.62860107421875, -3.49462890625, -3.36065673828125, -3.2266845703125, -3.09271240234375, -2.958740234375, -2.82476806640625, -2.6907958984375, -2.55682373046875, -2.4228515625, -2.28887939453125, -2.1549072265625, -2.02093505859375, -1.886962890625, -1.75299072265625, -1.6190185546875, -1.48504638671875, -1.35107421875, -1.21710205078125, -1.0831298828125, -0.94915771484375, -0.815185546875, -0.68121337890625, -0.5472412109375, -0.41326904296875, -0.279296875, -0.14532470703125, -0.0113525390625, 0.12261962890625, 0.256591796875, 0.39056396484375, 0.5245361328125, 0.65850830078125, 0.79248046875, 0.92645263671875, 1.0604248046875, 1.19439697265625, 1.328369140625, 1.46234130859375, 1.5963134765625, 1.73028564453125, 1.8642578125, 1.99822998046875, 2.1322021484375, 2.26617431640625, 2.400146484375, 2.53411865234375, 2.6680908203125, 2.80206298828125, 2.93603515625, 3.07000732421875, 3.2039794921875, 3.33795166015625, 3.471923828125, 3.60589599609375, 3.7398681640625, 3.87384033203125, 4.0078125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 5.0, 5.0, 3.0, 3.0, 8.0, 9.0, 8.0, 16.0, 15.0, 29.0, 32.0, 43.0, 67.0, 112.0, 149.0, 262.0, 468.0, 927.0, 1984.0, 5103.0, 17309.0, 79291.0, 539023.0, 319086.0, 62238.0, 14171.0, 4475.0, 1771.0, 763.0, 464.0, 254.0, 119.0, 86.0, 63.0, 64.0, 31.0, 17.0, 22.0, 13.0, 12.0, 9.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.81689453125, -0.7913055419921875, -0.765716552734375, -0.7401275634765625, -0.71453857421875, -0.6889495849609375, -0.663360595703125, -0.6377716064453125, -0.6121826171875, -0.5865936279296875, -0.561004638671875, -0.5354156494140625, -0.50982666015625, -0.4842376708984375, -0.458648681640625, -0.4330596923828125, -0.407470703125, -0.3818817138671875, -0.356292724609375, -0.3307037353515625, -0.30511474609375, -0.2795257568359375, -0.253936767578125, -0.2283477783203125, -0.2027587890625, -0.1771697998046875, -0.151580810546875, -0.1259918212890625, -0.10040283203125, -0.0748138427734375, -0.049224853515625, -0.0236358642578125, 0.001953125, 0.0275421142578125, 0.053131103515625, 0.0787200927734375, 0.10430908203125, 0.1298980712890625, 0.155487060546875, 0.1810760498046875, 0.2066650390625, 0.2322540283203125, 0.257843017578125, 0.2834320068359375, 0.30902099609375, 0.3346099853515625, 0.360198974609375, 0.3857879638671875, 0.411376953125, 0.4369659423828125, 0.462554931640625, 0.4881439208984375, 0.51373291015625, 0.5393218994140625, 0.564910888671875, 0.5904998779296875, 0.6160888671875, 0.6416778564453125, 0.667266845703125, 0.6928558349609375, 0.71844482421875, 0.7440338134765625, 0.769622802734375, 0.7952117919921875, 0.82080078125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 8.0, 6.0, 10.0, 11.0, 25.0, 25.0, 30.0, 28.0, 52.0, 60.0, 84.0, 96.0, 106.0, 89.0, 84.0, 69.0, 49.0, 35.0, 29.0, 19.0, 15.0, 11.0, 18.0, 12.0, 4.0, 8.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002582073211669922, -0.00024978071451187134, -0.0002413541078567505, -0.00023292750120162964, -0.0002245008945465088, -0.00021607428789138794, -0.0002076476812362671, -0.00019922107458114624, -0.0001907944679260254, -0.00018236786127090454, -0.0001739412546157837, -0.00016551464796066284, -0.000157088041305542, -0.00014866143465042114, -0.0001402348279953003, -0.00013180822134017944, -0.0001233816146850586, -0.00011495500802993774, -0.0001065284013748169, -9.810179471969604e-05, -8.96751880645752e-05, -8.124858140945435e-05, -7.28219747543335e-05, -6.439536809921265e-05, -5.59687614440918e-05, -4.754215478897095e-05, -3.91155481338501e-05, -3.068894147872925e-05, -2.22623348236084e-05, -1.3835728168487549e-05, -5.409121513366699e-06, 3.0174851417541504e-06, 1.1444091796875e-05, 1.987069845199585e-05, 2.82973051071167e-05, 3.672391176223755e-05, 4.51505184173584e-05, 5.357712507247925e-05, 6.20037317276001e-05, 7.043033838272095e-05, 7.88569450378418e-05, 8.728355169296265e-05, 9.57101583480835e-05, 0.00010413676500320435, 0.0001125633716583252, 0.00012098997831344604, 0.0001294165849685669, 0.00013784319162368774, 0.0001462697982788086, 0.00015469640493392944, 0.0001631230115890503, 0.00017154961824417114, 0.000179976224899292, 0.00018840283155441284, 0.0001968294382095337, 0.00020525604486465454, 0.0002136826515197754, 0.00022210925817489624, 0.0002305358648300171, 0.00023896247148513794, 0.0002473890781402588, 0.00025581568479537964, 0.0002642422914505005, 0.00027266889810562134, 0.0002810955047607422]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 11.0, 8.0, 13.0, 18.0, 27.0, 38.0, 73.0, 104.0, 200.0, 363.0, 813.0, 1802.0, 5419.0, 25837.0, 236634.0, 688404.0, 72861.0, 10663.0, 2935.0, 1125.0, 533.0, 278.0, 151.0, 87.0, 47.0, 34.0, 18.0, 17.0, 9.0, 7.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03125, -0.999267578125, -0.96728515625, -0.935302734375, -0.9033203125, -0.871337890625, -0.83935546875, -0.807373046875, -0.775390625, -0.743408203125, -0.71142578125, -0.679443359375, -0.6474609375, -0.615478515625, -0.58349609375, -0.551513671875, -0.51953125, -0.487548828125, -0.45556640625, -0.423583984375, -0.3916015625, -0.359619140625, -0.32763671875, -0.295654296875, -0.263671875, -0.231689453125, -0.19970703125, -0.167724609375, -0.1357421875, -0.103759765625, -0.07177734375, -0.039794921875, -0.0078125, 0.024169921875, 0.05615234375, 0.088134765625, 0.1201171875, 0.152099609375, 0.18408203125, 0.216064453125, 0.248046875, 0.280029296875, 0.31201171875, 0.343994140625, 0.3759765625, 0.407958984375, 0.43994140625, 0.471923828125, 0.50390625, 0.535888671875, 0.56787109375, 0.599853515625, 0.6318359375, 0.663818359375, 0.69580078125, 0.727783203125, 0.759765625, 0.791748046875, 0.82373046875, 0.855712890625, 0.8876953125, 0.919677734375, 0.95166015625, 0.983642578125, 1.015625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 10.0, 8.0, 11.0, 15.0, 23.0, 28.0, 46.0, 45.0, 64.0, 80.0, 81.0, 94.0, 93.0, 77.0, 72.0, 57.0, 58.0, 47.0, 27.0, 15.0, 15.0, 10.0, 7.0, 8.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1748046875, -1.1439743041992188, -1.1131439208984375, -1.0823135375976562, -1.051483154296875, -1.0206527709960938, -0.9898223876953125, -0.9589920043945312, -0.92816162109375, -0.8973312377929688, -0.8665008544921875, -0.8356704711914062, -0.804840087890625, -0.7740097045898438, -0.7431793212890625, -0.7123489379882812, -0.6815185546875, -0.6506881713867188, -0.6198577880859375, -0.5890274047851562, -0.558197021484375, -0.5273666381835938, -0.4965362548828125, -0.46570587158203125, -0.43487548828125, -0.40404510498046875, -0.3732147216796875, -0.34238433837890625, -0.311553955078125, -0.28072357177734375, -0.2498931884765625, -0.21906280517578125, -0.188232421875, -0.15740203857421875, -0.1265716552734375, -0.09574127197265625, -0.064910888671875, -0.03408050537109375, -0.0032501220703125, 0.02758026123046875, 0.05841064453125, 0.08924102783203125, 0.1200714111328125, 0.15090179443359375, 0.181732177734375, 0.21256256103515625, 0.2433929443359375, 0.27422332763671875, 0.3050537109375, 0.33588409423828125, 0.3667144775390625, 0.39754486083984375, 0.428375244140625, 0.45920562744140625, 0.4900360107421875, 0.5208663940429688, 0.55169677734375, 0.5825271606445312, 0.6133575439453125, 0.6441879272460938, 0.675018310546875, 0.7058486938476562, 0.7366790771484375, 0.7675094604492188, 0.79833984375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 14.0, 35.0, 49.0, 89.0, 143.0, 241.0, 162.0, 97.0, 81.0, 31.0, 17.0, 9.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.46628189086914, -22.787492752075195, -22.10870361328125, -21.429916381835938, -20.751127243041992, -20.072338104248047, -19.3935489654541, -18.714759826660156, -18.035972595214844, -17.3571834564209, -16.678394317626953, -15.999606132507324, -15.320817947387695, -14.64202880859375, -13.963239669799805, -13.284451484680176, -12.60566234588623, -11.926873207092285, -11.248085021972656, -10.569295883178711, -9.890507698059082, -9.211718559265137, -8.532930374145508, -7.8541412353515625, -7.175352573394775, -6.496563911437988, -5.817775249481201, -5.138986587524414, -4.460197448730469, -3.7814090251922607, -3.1026201248168945, -2.4238314628601074, -1.7450428009033203, -1.0662541389465332, -0.38746535778045654, 0.2913234233856201, 0.9701120853424072, 1.6489007472991943, 2.3276896476745605, 3.0064783096313477, 3.6852669715881348, 4.364055633544922, 5.042844295501709, 5.721632957458496, 6.400422096252441, 7.07921028137207, 7.757999420166016, 8.436788558959961, 9.11557674407959, 9.794365882873535, 10.473154067993164, 11.15194320678711, 11.830731391906738, 12.509520530700684, 13.188308715820312, 13.867097854614258, 14.545886993408203, 15.224676132202148, 15.903464317321777, 16.582252502441406, 17.26104164123535, 17.939830780029297, 18.618619918823242, 19.297409057617188, 19.9761962890625]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 5.0, 4.0, 11.0, 9.0, 13.0, 7.0, 17.0, 15.0, 13.0, 19.0, 25.0, 23.0, 28.0, 27.0, 35.0, 41.0, 48.0, 72.0, 66.0, 73.0, 64.0, 52.0, 41.0, 30.0, 33.0, 32.0, 27.0, 26.0, 18.0, 23.0, 24.0, 17.0, 9.0, 10.0, 8.0, 6.0, 6.0, 6.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.696672439575195, -13.268020629882812, -12.83936882019043, -12.410717964172363, -11.98206615447998, -11.553414344787598, -11.124763488769531, -10.696111679077148, -10.267459869384766, -9.838808059692383, -9.41015625, -8.981505393981934, -8.55285358428955, -8.124201774597168, -7.695550441741943, -7.266899108886719, -6.838247299194336, -6.409595489501953, -5.9809441566467285, -5.552292823791504, -5.123641014099121, -4.694989204406738, -4.266337871551514, -3.83768630027771, -3.4090347290039062, -2.9803831577301025, -2.551731586456299, -2.123080015182495, -1.6944284439086914, -1.2657768726348877, -0.837125301361084, -0.4084737300872803, 0.020178794860839844, 0.44883036613464355, 0.8774819374084473, 1.306133508682251, 1.7347850799560547, 2.1634366512298584, 2.592088222503662, 3.020739793777466, 3.4493913650512695, 3.8780429363250732, 4.306694507598877, 4.735345840454102, 5.163997650146484, 5.592649459838867, 6.021300792694092, 6.449952125549316, 6.878603935241699, 7.307255744934082, 7.735907077789307, 8.164558410644531, 8.593210220336914, 9.021862030029297, 9.45051383972168, 9.879164695739746, 10.307816505432129, 10.736468315124512, 11.165119171142578, 11.593770980834961, 12.022422790527344, 12.451074600219727, 12.87972640991211, 13.308377265930176, 13.737029075622559]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 4.0, 13.0, 14.0, 15.0, 14.0, 22.0, 34.0, 53.0, 52.0, 106.0, 158.0, 308.0, 671.0, 1601.0, 4078.0, 13659.0, 63166.0, 447574.0, 2217824.0, 1239799.0, 165566.0, 27650.0, 7213.0, 2532.0, 1015.0, 442.0, 239.0, 147.0, 97.0, 63.0, 34.0, 24.0, 19.0, 15.0, 16.0, 8.0, 9.0, 8.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95068359375, -0.9137802124023438, -0.8768768310546875, -0.8399734497070312, -0.803070068359375, -0.7661666870117188, -0.7292633056640625, -0.6923599243164062, -0.65545654296875, -0.6185531616210938, -0.5816497802734375, -0.5447463989257812, -0.507843017578125, -0.47093963623046875, -0.4340362548828125, -0.39713287353515625, -0.3602294921875, -0.32332611083984375, -0.2864227294921875, -0.24951934814453125, -0.212615966796875, -0.17571258544921875, -0.1388092041015625, -0.10190582275390625, -0.06500244140625, -0.02809906005859375, 0.0088043212890625, 0.04570770263671875, 0.082611083984375, 0.11951446533203125, 0.1564178466796875, 0.19332122802734375, 0.230224609375, 0.26712799072265625, 0.3040313720703125, 0.34093475341796875, 0.377838134765625, 0.41474151611328125, 0.4516448974609375, 0.48854827880859375, 0.52545166015625, 0.5623550415039062, 0.5992584228515625, 0.6361618041992188, 0.673065185546875, 0.7099685668945312, 0.7468719482421875, 0.7837753295898438, 0.8206787109375, 0.8575820922851562, 0.8944854736328125, 0.9313888549804688, 0.968292236328125, 1.0051956176757812, 1.0420989990234375, 1.0790023803710938, 1.11590576171875, 1.1528091430664062, 1.1897125244140625, 1.2266159057617188, 1.263519287109375, 1.3004226684570312, 1.3373260498046875, 1.3742294311523438, 1.4111328125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 10.0, 8.0, 10.0, 14.0, 12.0, 17.0, 22.0, 25.0, 32.0, 30.0, 32.0, 28.0, 36.0, 30.0, 50.0, 49.0, 50.0, 35.0, 52.0, 52.0, 40.0, 46.0, 33.0, 34.0, 33.0, 34.0, 28.0, 17.0, 24.0, 23.0, 19.0, 14.0, 9.0, 9.0, 9.0, 9.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.83935546875, -0.814544677734375, -0.78973388671875, -0.764923095703125, -0.7401123046875, -0.715301513671875, -0.69049072265625, -0.665679931640625, -0.640869140625, -0.616058349609375, -0.59124755859375, -0.566436767578125, -0.5416259765625, -0.516815185546875, -0.49200439453125, -0.467193603515625, -0.4423828125, -0.417572021484375, -0.39276123046875, -0.367950439453125, -0.3431396484375, -0.318328857421875, -0.29351806640625, -0.268707275390625, -0.243896484375, -0.219085693359375, -0.19427490234375, -0.169464111328125, -0.1446533203125, -0.119842529296875, -0.09503173828125, -0.070220947265625, -0.04541015625, -0.020599365234375, 0.00421142578125, 0.029022216796875, 0.0538330078125, 0.078643798828125, 0.10345458984375, 0.128265380859375, 0.153076171875, 0.177886962890625, 0.20269775390625, 0.227508544921875, 0.2523193359375, 0.277130126953125, 0.30194091796875, 0.326751708984375, 0.3515625, 0.376373291015625, 0.40118408203125, 0.425994873046875, 0.4508056640625, 0.475616455078125, 0.50042724609375, 0.525238037109375, 0.550048828125, 0.574859619140625, 0.59967041015625, 0.624481201171875, 0.6492919921875, 0.674102783203125, 0.69891357421875, 0.723724365234375, 0.74853515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 8.0, 12.0, 23.0, 34.0, 43.0, 100.0, 167.0, 305.0, 583.0, 1236.0, 3579.0, 13651.0, 92051.0, 2492407.0, 1515235.0, 60065.0, 9897.0, 2711.0, 1027.0, 501.0, 257.0, 147.0, 87.0, 49.0, 35.0, 22.0, 11.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.603515625, -2.531036376953125, -2.45855712890625, -2.386077880859375, -2.3135986328125, -2.241119384765625, -2.16864013671875, -2.096160888671875, -2.023681640625, -1.951202392578125, -1.87872314453125, -1.806243896484375, -1.7337646484375, -1.661285400390625, -1.58880615234375, -1.516326904296875, -1.44384765625, -1.371368408203125, -1.29888916015625, -1.226409912109375, -1.1539306640625, -1.081451416015625, -1.00897216796875, -0.936492919921875, -0.864013671875, -0.791534423828125, -0.71905517578125, -0.646575927734375, -0.5740966796875, -0.501617431640625, -0.42913818359375, -0.356658935546875, -0.2841796875, -0.211700439453125, -0.13922119140625, -0.066741943359375, 0.0057373046875, 0.078216552734375, 0.15069580078125, 0.223175048828125, 0.295654296875, 0.368133544921875, 0.44061279296875, 0.513092041015625, 0.5855712890625, 0.658050537109375, 0.73052978515625, 0.803009033203125, 0.87548828125, 0.947967529296875, 1.02044677734375, 1.092926025390625, 1.1654052734375, 1.237884521484375, 1.31036376953125, 1.382843017578125, 1.455322265625, 1.527801513671875, 1.60028076171875, 1.672760009765625, 1.7452392578125, 1.817718505859375, 1.89019775390625, 1.962677001953125, 2.03515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 8.0, 8.0, 7.0, 15.0, 6.0, 14.0, 21.0, 34.0, 43.0, 58.0, 105.0, 177.0, 288.0, 432.0, 665.0, 722.0, 551.0, 366.0, 220.0, 122.0, 68.0, 52.0, 33.0, 11.0, 16.0, 5.0, 10.0, 3.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9921875, -1.921417236328125, -1.85064697265625, -1.779876708984375, -1.7091064453125, -1.638336181640625, -1.56756591796875, -1.496795654296875, -1.426025390625, -1.355255126953125, -1.28448486328125, -1.213714599609375, -1.1429443359375, -1.072174072265625, -1.00140380859375, -0.930633544921875, -0.85986328125, -0.789093017578125, -0.71832275390625, -0.647552490234375, -0.5767822265625, -0.506011962890625, -0.43524169921875, -0.364471435546875, -0.293701171875, -0.222930908203125, -0.15216064453125, -0.081390380859375, -0.0106201171875, 0.060150146484375, 0.13092041015625, 0.201690673828125, 0.2724609375, 0.343231201171875, 0.41400146484375, 0.484771728515625, 0.5555419921875, 0.626312255859375, 0.69708251953125, 0.767852783203125, 0.838623046875, 0.909393310546875, 0.98016357421875, 1.050933837890625, 1.1217041015625, 1.192474365234375, 1.26324462890625, 1.334014892578125, 1.40478515625, 1.475555419921875, 1.54632568359375, 1.617095947265625, 1.6878662109375, 1.758636474609375, 1.82940673828125, 1.900177001953125, 1.970947265625, 2.041717529296875, 2.11248779296875, 2.183258056640625, 2.2540283203125, 2.324798583984375, 2.39556884765625, 2.466339111328125, 2.537109375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 7.0, 11.0, 28.0, 122.0, 342.0, 328.0, 128.0, 14.0, 10.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.348331451416016, -27.05377769470215, -25.75922393798828, -24.464670181274414, -23.170116424560547, -21.875564575195312, -20.581010818481445, -19.286457061767578, -17.99190330505371, -16.697349548339844, -15.402795791625977, -14.108242988586426, -12.813689231872559, -11.519135475158691, -10.22458267211914, -8.930028915405273, -7.635475158691406, -6.340921401977539, -5.04636812210083, -3.751814603805542, -2.457261085510254, -1.1627073287963867, 0.13184595108032227, 1.4263992309570312, 2.7209529876708984, 4.015506744384766, 5.310060024261475, 6.604613304138184, 7.899167060852051, 9.193720817565918, 10.488273620605469, 11.782827377319336, 13.077377319335938, 14.371931076049805, 15.666484832763672, 16.96103858947754, 18.255592346191406, 19.55014419555664, 20.844697952270508, 22.139251708984375, 23.433805465698242, 24.72835922241211, 26.022912979125977, 27.317466735839844, 28.612018585205078, 29.906574249267578, 31.201126098632812, 32.49568176269531, 33.79023361206055, 35.08478546142578, 36.37934112548828, 37.673892974853516, 38.968448638916016, 40.26300048828125, 41.55755615234375, 42.852108001708984, 44.14665985107422, 45.44121170043945, 46.73576736450195, 48.03031921386719, 49.32487487792969, 50.61942672729492, 51.91398239135742, 53.208534240722656, 54.503089904785156]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 8.0, 8.0, 13.0, 11.0, 23.0, 25.0, 20.0, 34.0, 26.0, 25.0, 42.0, 41.0, 50.0, 40.0, 55.0, 54.0, 52.0, 40.0, 53.0, 48.0, 35.0, 47.0, 39.0, 31.0, 30.0, 25.0, 24.0, 17.0, 19.0, 15.0, 17.0, 12.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.662504196166992, -9.341949462890625, -9.021394729614258, -8.70083999633789, -8.380285263061523, -8.059730529785156, -7.739176273345947, -7.418622016906738, -7.098067283630371, -6.777512550354004, -6.456957817077637, -6.1364030838012695, -5.8158488273620605, -5.495294094085693, -5.174739360809326, -4.854185104370117, -4.533629894256592, -4.213075160980225, -3.8925206661224365, -3.5719659328460693, -3.2514114379882812, -2.930856704711914, -2.610301971435547, -2.289747476577759, -1.9691927433013916, -1.648638129234314, -1.3280835151672363, -1.0075287818908691, -0.6869741678237915, -0.36641955375671387, -0.04586482048034668, 0.2746896743774414, 0.5952444076538086, 0.9157990217208862, 1.2363536357879639, 1.556908369064331, 1.8774629831314087, 2.1980175971984863, 2.5185723304748535, 2.8391268253326416, 3.159681558609009, 3.480236291885376, 3.800790786743164, 4.121345520019531, 4.441900253295898, 4.762454986572266, 5.083009719848633, 5.403563976287842, 5.724118709564209, 6.044673442840576, 6.365228176116943, 6.685782432556152, 7.0063371658325195, 7.326891899108887, 7.647446632385254, 7.968001365661621, 8.288556098937988, 8.609110832214355, 8.929665565490723, 9.25022029876709, 9.570775032043457, 9.891328811645508, 10.211883544921875, 10.532438278198242, 10.85299301147461]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 12.0, 24.0, 22.0, 53.0, 85.0, 152.0, 231.0, 357.0, 576.0, 975.0, 1622.0, 3056.0, 5716.0, 10755.0, 21035.0, 42981.0, 88185.0, 167579.0, 243458.0, 213388.0, 123941.0, 61940.0, 30112.0, 14929.0, 7741.0, 4125.0, 2280.0, 1268.0, 739.0, 438.0, 300.0, 179.0, 114.0, 65.0, 41.0, 30.0, 15.0, 11.0, 4.0, 3.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0078125, -0.97393798828125, -0.9400634765625, -0.90618896484375, -0.872314453125, -0.83843994140625, -0.8045654296875, -0.77069091796875, -0.73681640625, -0.70294189453125, -0.6690673828125, -0.63519287109375, -0.601318359375, -0.56744384765625, -0.5335693359375, -0.49969482421875, -0.4658203125, -0.43194580078125, -0.3980712890625, -0.36419677734375, -0.330322265625, -0.29644775390625, -0.2625732421875, -0.22869873046875, -0.19482421875, -0.16094970703125, -0.1270751953125, -0.09320068359375, -0.059326171875, -0.02545166015625, 0.0084228515625, 0.04229736328125, 0.076171875, 0.11004638671875, 0.1439208984375, 0.17779541015625, 0.211669921875, 0.24554443359375, 0.2794189453125, 0.31329345703125, 0.34716796875, 0.38104248046875, 0.4149169921875, 0.44879150390625, 0.482666015625, 0.51654052734375, 0.5504150390625, 0.58428955078125, 0.6181640625, 0.65203857421875, 0.6859130859375, 0.71978759765625, 0.753662109375, 0.78753662109375, 0.8214111328125, 0.85528564453125, 0.88916015625, 0.92303466796875, 0.9569091796875, 0.99078369140625, 1.024658203125, 1.05853271484375, 1.0924072265625, 1.12628173828125, 1.16015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 7.0, 10.0, 13.0, 10.0, 16.0, 21.0, 25.0, 35.0, 27.0, 37.0, 27.0, 30.0, 40.0, 41.0, 41.0, 43.0, 43.0, 49.0, 51.0, 50.0, 44.0, 48.0, 33.0, 25.0, 27.0, 27.0, 31.0, 24.0, 20.0, 17.0, 11.0, 9.0, 13.0, 7.0, 8.0, 5.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.841796875, -0.815704345703125, -0.78961181640625, -0.763519287109375, -0.7374267578125, -0.711334228515625, -0.68524169921875, -0.659149169921875, -0.633056640625, -0.606964111328125, -0.58087158203125, -0.554779052734375, -0.5286865234375, -0.502593994140625, -0.47650146484375, -0.450408935546875, -0.42431640625, -0.398223876953125, -0.37213134765625, -0.346038818359375, -0.3199462890625, -0.293853759765625, -0.26776123046875, -0.241668701171875, -0.215576171875, -0.189483642578125, -0.16339111328125, -0.137298583984375, -0.1112060546875, -0.085113525390625, -0.05902099609375, -0.032928466796875, -0.0068359375, 0.019256591796875, 0.04534912109375, 0.071441650390625, 0.0975341796875, 0.123626708984375, 0.14971923828125, 0.175811767578125, 0.201904296875, 0.227996826171875, 0.25408935546875, 0.280181884765625, 0.3062744140625, 0.332366943359375, 0.35845947265625, 0.384552001953125, 0.41064453125, 0.436737060546875, 0.46282958984375, 0.488922119140625, 0.5150146484375, 0.541107177734375, 0.56719970703125, 0.593292236328125, 0.619384765625, 0.645477294921875, 0.67156982421875, 0.697662353515625, 0.7237548828125, 0.749847412109375, 0.77593994140625, 0.802032470703125, 0.828125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 4.0, 12.0, 7.0, 13.0, 16.0, 20.0, 28.0, 22.0, 49.0, 95.0, 133.0, 272.0, 541.0, 1332.0, 3918.0, 15196.0, 76798.0, 547081.0, 325421.0, 59617.0, 12322.0, 3379.0, 1162.0, 422.0, 229.0, 137.0, 105.0, 66.0, 40.0, 29.0, 21.0, 14.0, 15.0, 10.0, 9.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.46331787109375, -2.3836669921875, -2.30401611328125, -2.224365234375, -2.14471435546875, -2.0650634765625, -1.98541259765625, -1.90576171875, -1.82611083984375, -1.7464599609375, -1.66680908203125, -1.587158203125, -1.50750732421875, -1.4278564453125, -1.34820556640625, -1.2685546875, -1.18890380859375, -1.1092529296875, -1.02960205078125, -0.949951171875, -0.87030029296875, -0.7906494140625, -0.71099853515625, -0.63134765625, -0.55169677734375, -0.4720458984375, -0.39239501953125, -0.312744140625, -0.23309326171875, -0.1534423828125, -0.07379150390625, 0.005859375, 0.08551025390625, 0.1651611328125, 0.24481201171875, 0.324462890625, 0.40411376953125, 0.4837646484375, 0.56341552734375, 0.64306640625, 0.72271728515625, 0.8023681640625, 0.88201904296875, 0.961669921875, 1.04132080078125, 1.1209716796875, 1.20062255859375, 1.2802734375, 1.35992431640625, 1.4395751953125, 1.51922607421875, 1.598876953125, 1.67852783203125, 1.7581787109375, 1.83782958984375, 1.91748046875, 1.99713134765625, 2.0767822265625, 2.15643310546875, 2.236083984375, 2.31573486328125, 2.3953857421875, 2.47503662109375, 2.5546875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 9.0, 5.0, 8.0, 14.0, 13.0, 19.0, 13.0, 26.0, 35.0, 39.0, 46.0, 37.0, 62.0, 52.0, 59.0, 66.0, 62.0, 56.0, 59.0, 52.0, 50.0, 27.0, 35.0, 27.0, 19.0, 20.0, 15.0, 15.0, 11.0, 14.0, 11.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.1875, -4.071258544921875, -3.95501708984375, -3.838775634765625, -3.7225341796875, -3.606292724609375, -3.49005126953125, -3.373809814453125, -3.257568359375, -3.141326904296875, -3.02508544921875, -2.908843994140625, -2.7926025390625, -2.676361083984375, -2.56011962890625, -2.443878173828125, -2.32763671875, -2.211395263671875, -2.09515380859375, -1.978912353515625, -1.8626708984375, -1.746429443359375, -1.63018798828125, -1.513946533203125, -1.397705078125, -1.281463623046875, -1.16522216796875, -1.048980712890625, -0.9327392578125, -0.816497802734375, -0.70025634765625, -0.584014892578125, -0.4677734375, -0.351531982421875, -0.23529052734375, -0.119049072265625, -0.0028076171875, 0.113433837890625, 0.22967529296875, 0.345916748046875, 0.462158203125, 0.578399658203125, 0.69464111328125, 0.810882568359375, 0.9271240234375, 1.043365478515625, 1.15960693359375, 1.275848388671875, 1.39208984375, 1.508331298828125, 1.62457275390625, 1.740814208984375, 1.8570556640625, 1.973297119140625, 2.08953857421875, 2.205780029296875, 2.322021484375, 2.438262939453125, 2.55450439453125, 2.670745849609375, 2.7869873046875, 2.903228759765625, 3.01947021484375, 3.135711669921875, 3.251953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 9.0, 13.0, 9.0, 10.0, 23.0, 31.0, 42.0, 68.0, 78.0, 127.0, 222.0, 357.0, 564.0, 1002.0, 1929.0, 3977.0, 8952.0, 22583.0, 62492.0, 182952.0, 512621.0, 160211.0, 54695.0, 19602.0, 8070.0, 3629.0, 1831.0, 988.0, 548.0, 330.0, 209.0, 120.0, 81.0, 66.0, 39.0, 23.0, 21.0, 11.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.591796875, -0.5750961303710938, -0.5583953857421875, -0.5416946411132812, -0.524993896484375, -0.5082931518554688, -0.4915924072265625, -0.47489166259765625, -0.45819091796875, -0.44149017333984375, -0.4247894287109375, -0.40808868408203125, -0.391387939453125, -0.37468719482421875, -0.3579864501953125, -0.34128570556640625, -0.3245849609375, -0.30788421630859375, -0.2911834716796875, -0.27448272705078125, -0.257781982421875, -0.24108123779296875, -0.2243804931640625, -0.20767974853515625, -0.19097900390625, -0.17427825927734375, -0.1575775146484375, -0.14087677001953125, -0.124176025390625, -0.10747528076171875, -0.0907745361328125, -0.07407379150390625, -0.057373046875, -0.04067230224609375, -0.0239715576171875, -0.00727081298828125, 0.009429931640625, 0.02613067626953125, 0.0428314208984375, 0.05953216552734375, 0.07623291015625, 0.09293365478515625, 0.1096343994140625, 0.12633514404296875, 0.143035888671875, 0.15973663330078125, 0.1764373779296875, 0.19313812255859375, 0.2098388671875, 0.22653961181640625, 0.2432403564453125, 0.25994110107421875, 0.276641845703125, 0.29334259033203125, 0.3100433349609375, 0.32674407958984375, 0.34344482421875, 0.36014556884765625, 0.3768463134765625, 0.39354705810546875, 0.410247802734375, 0.42694854736328125, 0.4436492919921875, 0.46035003662109375, 0.47705078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 0.0, 4.0, 5.0, 11.0, 13.0, 16.0, 42.0, 47.0, 74.0, 126.0, 151.0, 151.0, 120.0, 90.0, 54.0, 35.0, 25.0, 14.0, 6.0, 1.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003600120544433594, -0.000347677618265152, -0.0003353431820869446, -0.0003230087459087372, -0.0003106743097305298, -0.0002983398735523224, -0.000286005437374115, -0.0002736710011959076, -0.0002613365650177002, -0.0002490021288394928, -0.0002366676926612854, -0.000224333256483078, -0.0002119988203048706, -0.0001996643841266632, -0.0001873299479484558, -0.0001749955117702484, -0.00016266107559204102, -0.00015032663941383362, -0.00013799220323562622, -0.00012565776705741882, -0.00011332333087921143, -0.00010098889470100403, -8.865445852279663e-05, -7.632002234458923e-05, -6.398558616638184e-05, -5.165114998817444e-05, -3.931671380996704e-05, -2.6982277631759644e-05, -1.4647841453552246e-05, -2.3134052753448486e-06, 1.0021030902862549e-05, 2.2355467081069946e-05, 3.4689903259277344e-05, 4.702433943748474e-05, 5.935877561569214e-05, 7.169321179389954e-05, 8.402764797210693e-05, 9.636208415031433e-05, 0.00010869652032852173, 0.00012103095650672913, 0.00013336539268493652, 0.00014569982886314392, 0.00015803426504135132, 0.00017036870121955872, 0.0001827031373977661, 0.0001950375735759735, 0.0002073720097541809, 0.0002197064459323883, 0.0002320408821105957, 0.0002443753182888031, 0.0002567097544670105, 0.0002690441906452179, 0.0002813786268234253, 0.0002937130630016327, 0.0003060474991798401, 0.0003183819353580475, 0.0003307163715362549, 0.0003430508077144623, 0.0003553852438926697, 0.0003677196800708771, 0.00038005411624908447, 0.00039238855242729187, 0.00040472298860549927, 0.00041705742478370667, 0.00042939186096191406]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 8.0, 9.0, 16.0, 18.0, 31.0, 50.0, 88.0, 174.0, 361.0, 825.0, 2405.0, 8167.0, 37374.0, 219302.0, 642154.0, 109940.0, 19962.0, 4943.0, 1548.0, 571.0, 245.0, 143.0, 78.0, 39.0, 28.0, 26.0, 17.0, 13.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0166015625, -0.9886016845703125, -0.960601806640625, -0.9326019287109375, -0.90460205078125, -0.8766021728515625, -0.848602294921875, -0.8206024169921875, -0.7926025390625, -0.7646026611328125, -0.736602783203125, -0.7086029052734375, -0.68060302734375, -0.6526031494140625, -0.624603271484375, -0.5966033935546875, -0.568603515625, -0.5406036376953125, -0.512603759765625, -0.4846038818359375, -0.45660400390625, -0.4286041259765625, -0.400604248046875, -0.3726043701171875, -0.3446044921875, -0.3166046142578125, -0.288604736328125, -0.2606048583984375, -0.23260498046875, -0.2046051025390625, -0.176605224609375, -0.1486053466796875, -0.12060546875, -0.0926055908203125, -0.064605712890625, -0.0366058349609375, -0.00860595703125, 0.0193939208984375, 0.047393798828125, 0.0753936767578125, 0.1033935546875, 0.1313934326171875, 0.159393310546875, 0.1873931884765625, 0.21539306640625, 0.2433929443359375, 0.271392822265625, 0.2993927001953125, 0.327392578125, 0.3553924560546875, 0.383392333984375, 0.4113922119140625, 0.43939208984375, 0.4673919677734375, 0.495391845703125, 0.5233917236328125, 0.5513916015625, 0.5793914794921875, 0.607391357421875, 0.6353912353515625, 0.66339111328125, 0.6913909912109375, 0.719390869140625, 0.7473907470703125, 0.775390625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 8.0, 3.0, 7.0, 12.0, 7.0, 21.0, 13.0, 23.0, 31.0, 35.0, 51.0, 48.0, 83.0, 66.0, 81.0, 71.0, 71.0, 55.0, 56.0, 46.0, 48.0, 38.0, 34.0, 25.0, 19.0, 11.0, 11.0, 6.0, 8.0, 5.0, 3.0, 5.0, 2.0, 0.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83837890625, -0.8147430419921875, -0.791107177734375, -0.7674713134765625, -0.74383544921875, -0.7201995849609375, -0.696563720703125, -0.6729278564453125, -0.6492919921875, -0.6256561279296875, -0.602020263671875, -0.5783843994140625, -0.55474853515625, -0.5311126708984375, -0.507476806640625, -0.4838409423828125, -0.460205078125, -0.4365692138671875, -0.412933349609375, -0.3892974853515625, -0.36566162109375, -0.3420257568359375, -0.318389892578125, -0.2947540283203125, -0.2711181640625, -0.2474822998046875, -0.223846435546875, -0.2002105712890625, -0.17657470703125, -0.1529388427734375, -0.129302978515625, -0.1056671142578125, -0.08203125, -0.0583953857421875, -0.034759521484375, -0.0111236572265625, 0.01251220703125, 0.0361480712890625, 0.059783935546875, 0.0834197998046875, 0.1070556640625, 0.1306915283203125, 0.154327392578125, 0.1779632568359375, 0.20159912109375, 0.2252349853515625, 0.248870849609375, 0.2725067138671875, 0.296142578125, 0.3197784423828125, 0.343414306640625, 0.3670501708984375, 0.39068603515625, 0.4143218994140625, 0.437957763671875, 0.4615936279296875, 0.4852294921875, 0.5088653564453125, 0.532501220703125, 0.5561370849609375, 0.57977294921875, 0.6034088134765625, 0.627044677734375, 0.6506805419921875, 0.67431640625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 5.0, 10.0, 19.0, 20.0, 38.0, 55.0, 86.0, 129.0, 216.0, 124.0, 100.0, 68.0, 37.0, 22.0, 14.0, 15.0, 10.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.267129898071289, -14.783132553100586, -14.2991361618042, -13.815138816833496, -13.33114242553711, -12.847145080566406, -12.363147735595703, -11.879151344299316, -11.39515495300293, -10.911157608032227, -10.42716121673584, -9.943163871765137, -9.45916748046875, -8.975170135498047, -8.491172790527344, -8.007176399230957, -7.523179054260254, -7.039182186126709, -6.555185317993164, -6.071187973022461, -5.587191581726074, -5.103194236755371, -4.619197368621826, -4.135200500488281, -3.6512036323547363, -3.1672067642211914, -2.6832098960876465, -2.1992127895355225, -1.7152159214019775, -1.2312190532684326, -0.7472219467163086, -0.26322507858276367, 0.22077178955078125, 0.704768717288971, 1.1887656450271606, 1.6727626323699951, 2.15675950050354, 2.640756368637085, 3.124753475189209, 3.608750343322754, 4.092747211456299, 4.576744079589844, 5.060740947723389, 5.544737815856934, 6.028735160827637, 6.512731552124023, 6.996728897094727, 7.4807257652282715, 7.964722633361816, 8.44871997833252, 8.932716369628906, 9.41671371459961, 9.900710105895996, 10.3847074508667, 10.868703842163086, 11.352701187133789, 11.836698532104492, 12.320695877075195, 12.804692268371582, 13.288689613342285, 13.772686004638672, 14.256683349609375, 14.740680694580078, 15.224677085876465, 15.708673477172852]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 12.0, 8.0, 9.0, 12.0, 17.0, 16.0, 15.0, 19.0, 29.0, 26.0, 41.0, 53.0, 48.0, 65.0, 91.0, 91.0, 79.0, 56.0, 31.0, 43.0, 40.0, 25.0, 32.0, 28.0, 19.0, 11.0, 18.0, 12.0, 15.0, 8.0, 7.0, 4.0, 5.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.069927215576172, -14.602636337280273, -14.135345458984375, -13.668054580688477, -13.200763702392578, -12.73347282409668, -12.266181945800781, -11.7988920211792, -11.3316011428833, -10.864310264587402, -10.397019386291504, -9.929728507995605, -9.462437629699707, -8.995147705078125, -8.527856826782227, -8.060565948486328, -7.5932745933532715, -7.125983715057373, -6.658692836761475, -6.191402435302734, -5.724111557006836, -5.2568206787109375, -4.789529800415039, -4.322238922119141, -3.8549482822418213, -3.387657403945923, -2.9203667640686035, -2.453075885772705, -1.9857851266860962, -1.5184943675994873, -1.0512034893035889, -0.5839128494262695, -0.1166219711303711, 0.3506688177585602, 0.8179596066474915, 1.2852504253387451, 1.752541184425354, 2.219831943511963, 2.6871228218078613, 3.1544134616851807, 3.621704339981079, 4.088994979858398, 4.556285858154297, 5.023576736450195, 5.490867614746094, 5.958158493041992, 6.425449371337891, 6.892739772796631, 7.360030651092529, 7.827321529388428, 8.294611930847168, 8.761902809143066, 9.229193687438965, 9.696484565734863, 10.163775444030762, 10.63106632232666, 11.098357200622559, 11.565648078918457, 12.032938957214355, 12.500229835510254, 12.967520713806152, 13.434810638427734, 13.902101516723633, 14.369392395019531, 14.83668327331543]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 3.0, 2.0, 4.0, 11.0, 7.0, 15.0, 14.0, 28.0, 42.0, 61.0, 78.0, 143.0, 223.0, 348.0, 602.0, 1115.0, 2324.0, 4762.0, 11598.0, 32795.0, 116644.0, 467103.0, 1492373.0, 1454243.0, 448417.0, 110703.0, 30575.0, 10702.0, 4589.0, 2142.0, 1051.0, 593.0, 363.0, 220.0, 135.0, 74.0, 59.0, 39.0, 28.0, 17.0, 10.0, 7.0, 11.0, 5.0, 5.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68408203125, -0.6577529907226562, -0.6314239501953125, -0.6050949096679688, -0.578765869140625, -0.5524368286132812, -0.5261077880859375, -0.49977874755859375, -0.47344970703125, -0.44712066650390625, -0.4207916259765625, -0.39446258544921875, -0.368133544921875, -0.34180450439453125, -0.3154754638671875, -0.28914642333984375, -0.2628173828125, -0.23648834228515625, -0.2101593017578125, -0.18383026123046875, -0.157501220703125, -0.13117218017578125, -0.1048431396484375, -0.07851409912109375, -0.05218505859375, -0.02585601806640625, 0.0004730224609375, 0.02680206298828125, 0.053131103515625, 0.07946014404296875, 0.1057891845703125, 0.13211822509765625, 0.158447265625, 0.18477630615234375, 0.2111053466796875, 0.23743438720703125, 0.263763427734375, 0.29009246826171875, 0.3164215087890625, 0.34275054931640625, 0.36907958984375, 0.39540863037109375, 0.4217376708984375, 0.44806671142578125, 0.474395751953125, 0.5007247924804688, 0.5270538330078125, 0.5533828735351562, 0.5797119140625, 0.6060409545898438, 0.6323699951171875, 0.6586990356445312, 0.685028076171875, 0.7113571166992188, 0.7376861572265625, 0.7640151977539062, 0.79034423828125, 0.8166732788085938, 0.8430023193359375, 0.8693313598632812, 0.895660400390625, 0.9219894409179688, 0.9483184814453125, 0.9746475219726562, 1.0009765625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 5.0, 8.0, 9.0, 8.0, 8.0, 9.0, 15.0, 18.0, 24.0, 27.0, 31.0, 26.0, 34.0, 27.0, 31.0, 29.0, 38.0, 37.0, 39.0, 49.0, 47.0, 43.0, 34.0, 43.0, 50.0, 35.0, 33.0, 26.0, 32.0, 21.0, 24.0, 29.0, 18.0, 13.0, 11.0, 6.0, 12.0, 9.0, 11.0, 4.0, 5.0, 8.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.73193359375, -0.70849609375, -0.68505859375, -0.66162109375, -0.63818359375, -0.61474609375, -0.59130859375, -0.56787109375, -0.54443359375, -0.52099609375, -0.49755859375, -0.47412109375, -0.45068359375, -0.42724609375, -0.40380859375, -0.38037109375, -0.35693359375, -0.33349609375, -0.31005859375, -0.28662109375, -0.26318359375, -0.23974609375, -0.21630859375, -0.19287109375, -0.16943359375, -0.14599609375, -0.12255859375, -0.09912109375, -0.07568359375, -0.05224609375, -0.02880859375, -0.00537109375, 0.01806640625, 0.04150390625, 0.06494140625, 0.08837890625, 0.11181640625, 0.13525390625, 0.15869140625, 0.18212890625, 0.20556640625, 0.22900390625, 0.25244140625, 0.27587890625, 0.29931640625, 0.32275390625, 0.34619140625, 0.36962890625, 0.39306640625, 0.41650390625, 0.43994140625, 0.46337890625, 0.48681640625, 0.51025390625, 0.53369140625, 0.55712890625, 0.58056640625, 0.60400390625, 0.62744140625, 0.65087890625, 0.67431640625, 0.69775390625, 0.72119140625, 0.74462890625, 0.76806640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 6.0, 3.0, 4.0, 16.0, 20.0, 40.0, 93.0, 164.0, 382.0, 1391.0, 13601.0, 1830684.0, 2330377.0, 15383.0, 1437.0, 356.0, 161.0, 98.0, 41.0, 17.0, 13.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.318359375, -3.180206298828125, -3.04205322265625, -2.903900146484375, -2.7657470703125, -2.627593994140625, -2.48944091796875, -2.351287841796875, -2.213134765625, -2.074981689453125, -1.93682861328125, -1.798675537109375, -1.6605224609375, -1.522369384765625, -1.38421630859375, -1.246063232421875, -1.10791015625, -0.969757080078125, -0.83160400390625, -0.693450927734375, -0.5552978515625, -0.417144775390625, -0.27899169921875, -0.140838623046875, -0.002685546875, 0.135467529296875, 0.27362060546875, 0.411773681640625, 0.5499267578125, 0.688079833984375, 0.82623291015625, 0.964385986328125, 1.1025390625, 1.240692138671875, 1.37884521484375, 1.516998291015625, 1.6551513671875, 1.793304443359375, 1.93145751953125, 2.069610595703125, 2.207763671875, 2.345916748046875, 2.48406982421875, 2.622222900390625, 2.7603759765625, 2.898529052734375, 3.03668212890625, 3.174835205078125, 3.31298828125, 3.451141357421875, 3.58929443359375, 3.727447509765625, 3.8656005859375, 4.003753662109375, 4.14190673828125, 4.280059814453125, 4.418212890625, 4.556365966796875, 4.69451904296875, 4.832672119140625, 4.9708251953125, 5.108978271484375, 5.24713134765625, 5.385284423828125, 5.5234375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 14.0, 19.0, 38.0, 44.0, 70.0, 161.0, 244.0, 478.0, 777.0, 849.0, 595.0, 355.0, 156.0, 76.0, 73.0, 50.0, 26.0, 10.0, 7.0, 13.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0], "bins": [-4.01171875, -3.926544189453125, -3.84136962890625, -3.756195068359375, -3.6710205078125, -3.585845947265625, -3.50067138671875, -3.415496826171875, -3.330322265625, -3.245147705078125, -3.15997314453125, -3.074798583984375, -2.9896240234375, -2.904449462890625, -2.81927490234375, -2.734100341796875, -2.64892578125, -2.563751220703125, -2.47857666015625, -2.393402099609375, -2.3082275390625, -2.223052978515625, -2.13787841796875, -2.052703857421875, -1.967529296875, -1.882354736328125, -1.79718017578125, -1.712005615234375, -1.6268310546875, -1.541656494140625, -1.45648193359375, -1.371307373046875, -1.2861328125, -1.200958251953125, -1.11578369140625, -1.030609130859375, -0.9454345703125, -0.860260009765625, -0.77508544921875, -0.689910888671875, -0.604736328125, -0.519561767578125, -0.43438720703125, -0.349212646484375, -0.2640380859375, -0.178863525390625, -0.09368896484375, -0.008514404296875, 0.07666015625, 0.161834716796875, 0.24700927734375, 0.332183837890625, 0.4173583984375, 0.502532958984375, 0.58770751953125, 0.672882080078125, 0.758056640625, 0.843231201171875, 0.92840576171875, 1.013580322265625, 1.0987548828125, 1.183929443359375, 1.26910400390625, 1.354278564453125, 1.439453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 9.0, 14.0, 37.0, 72.0, 208.0, 290.0, 195.0, 106.0, 40.0, 14.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.456514358520508, -23.56256675720215, -22.668621063232422, -21.774673461914062, -20.880725860595703, -19.986778259277344, -19.092830657958984, -18.198884963989258, -17.3049373626709, -16.41098976135254, -15.517043113708496, -14.623096466064453, -13.729148864746094, -12.835201263427734, -11.941254615783691, -11.047307968139648, -10.153360366821289, -9.25941276550293, -8.365466117858887, -7.4715189933776855, -6.577571868896484, -5.683624744415283, -4.789677619934082, -3.895730495452881, -3.0017833709716797, -2.1078362464904785, -1.2138891220092773, -0.31994199752807617, 0.574005126953125, 1.4679522514343262, 2.3618993759155273, 3.2558465003967285, 4.149791717529297, 5.043738842010498, 5.937685966491699, 6.8316330909729, 7.725580215454102, 8.619527816772461, 9.513474464416504, 10.407421112060547, 11.301368713378906, 12.195316314697266, 13.089262962341309, 13.983209609985352, 14.877157211303711, 15.77110481262207, 16.665050506591797, 17.558998107910156, 18.452945709228516, 19.346893310546875, 20.240840911865234, 21.13478660583496, 22.02873420715332, 22.92268180847168, 23.816627502441406, 24.710575103759766, 25.604522705078125, 26.498470306396484, 27.392417907714844, 28.28636360168457, 29.18031120300293, 30.07425880432129, 30.968204498291016, 31.862152099609375, 32.756099700927734]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 7.0, 4.0, 9.0, 14.0, 11.0, 10.0, 13.0, 17.0, 28.0, 24.0, 15.0, 28.0, 29.0, 24.0, 24.0, 57.0, 47.0, 37.0, 32.0, 43.0, 42.0, 42.0, 43.0, 42.0, 36.0, 46.0, 43.0, 31.0, 28.0, 32.0, 29.0, 25.0, 15.0, 11.0, 5.0, 17.0, 16.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.94741678237915, -7.677839279174805, -7.408262252807617, -7.1386847496032715, -6.869107246398926, -6.599530220031738, -6.329952716827393, -6.060375213623047, -5.790798187255859, -5.521220684051514, -5.251643657684326, -4.9820661544799805, -4.712488651275635, -4.442911148071289, -4.173334121704102, -3.903756618499756, -3.63417911529541, -3.3646018505096436, -3.095024347305298, -2.8254470825195312, -2.5558695793151855, -2.286292314529419, -2.0167150497436523, -1.7471376657485962, -1.47756028175354, -1.2079828977584839, -0.9384055733680725, -0.6688282489776611, -0.399250864982605, -0.12967348098754883, 0.13990378379821777, 0.4094811677932739, 0.6790590286254883, 0.9486364126205444, 1.2182137966156006, 1.4877910614013672, 1.7573684453964233, 2.0269458293914795, 2.296523094177246, 2.566100597381592, 2.8356778621673584, 3.105255126953125, 3.3748326301574707, 3.6444098949432373, 3.913987159729004, 4.18356466293335, 4.453142166137695, 4.722719192504883, 4.9922966957092285, 5.261874198913574, 5.531451225280762, 5.801028728485107, 6.070606231689453, 6.340183258056641, 6.609760761260986, 6.879338264465332, 7.1489152908325195, 7.418492794036865, 7.688069820404053, 7.957647323608398, 8.227224349975586, 8.49680233001709, 8.766379356384277, 9.035956382751465, 9.305534362792969]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 4.0, 1.0, 13.0, 5.0, 18.0, 18.0, 35.0, 77.0, 103.0, 177.0, 266.0, 459.0, 835.0, 1529.0, 2833.0, 5593.0, 11086.0, 23603.0, 49528.0, 105862.0, 214314.0, 282944.0, 182519.0, 87214.0, 40688.0, 19363.0, 9294.0, 4708.0, 2316.0, 1331.0, 735.0, 456.0, 248.0, 131.0, 80.0, 61.0, 43.0, 29.0, 21.0, 5.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2978515625, -1.2621688842773438, -1.2264862060546875, -1.1908035278320312, -1.155120849609375, -1.1194381713867188, -1.0837554931640625, -1.0480728149414062, -1.01239013671875, -0.9767074584960938, -0.9410247802734375, -0.9053421020507812, -0.869659423828125, -0.8339767456054688, -0.7982940673828125, -0.7626113891601562, -0.7269287109375, -0.6912460327148438, -0.6555633544921875, -0.6198806762695312, -0.584197998046875, -0.5485153198242188, -0.5128326416015625, -0.47714996337890625, -0.44146728515625, -0.40578460693359375, -0.3701019287109375, -0.33441925048828125, -0.298736572265625, -0.26305389404296875, -0.2273712158203125, -0.19168853759765625, -0.156005859375, -0.12032318115234375, -0.0846405029296875, -0.04895782470703125, -0.013275146484375, 0.02240753173828125, 0.0580902099609375, 0.09377288818359375, 0.12945556640625, 0.16513824462890625, 0.2008209228515625, 0.23650360107421875, 0.272186279296875, 0.30786895751953125, 0.3435516357421875, 0.37923431396484375, 0.4149169921875, 0.45059967041015625, 0.4862823486328125, 0.5219650268554688, 0.557647705078125, 0.5933303833007812, 0.6290130615234375, 0.6646957397460938, 0.70037841796875, 0.7360610961914062, 0.7717437744140625, 0.8074264526367188, 0.843109130859375, 0.8787918090820312, 0.9144744873046875, 0.9501571655273438, 0.98583984375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 3.0, 1.0, 8.0, 2.0, 8.0, 6.0, 10.0, 5.0, 12.0, 15.0, 26.0, 18.0, 23.0, 25.0, 20.0, 35.0, 29.0, 32.0, 38.0, 44.0, 40.0, 42.0, 55.0, 47.0, 46.0, 52.0, 45.0, 28.0, 34.0, 46.0, 35.0, 29.0, 21.0, 21.0, 19.0, 20.0, 13.0, 9.0, 7.0, 7.0, 8.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.93017578125, -0.9033966064453125, -0.876617431640625, -0.8498382568359375, -0.82305908203125, -0.7962799072265625, -0.769500732421875, -0.7427215576171875, -0.7159423828125, -0.6891632080078125, -0.662384033203125, -0.6356048583984375, -0.60882568359375, -0.5820465087890625, -0.555267333984375, -0.5284881591796875, -0.501708984375, -0.4749298095703125, -0.448150634765625, -0.4213714599609375, -0.39459228515625, -0.3678131103515625, -0.341033935546875, -0.3142547607421875, -0.2874755859375, -0.2606964111328125, -0.233917236328125, -0.2071380615234375, -0.18035888671875, -0.1535797119140625, -0.126800537109375, -0.1000213623046875, -0.0732421875, -0.0464630126953125, -0.019683837890625, 0.0070953369140625, 0.03387451171875, 0.0606536865234375, 0.087432861328125, 0.1142120361328125, 0.1409912109375, 0.1677703857421875, 0.194549560546875, 0.2213287353515625, 0.24810791015625, 0.2748870849609375, 0.301666259765625, 0.3284454345703125, 0.355224609375, 0.3820037841796875, 0.408782958984375, 0.4355621337890625, 0.46234130859375, 0.4891204833984375, 0.515899658203125, 0.5426788330078125, 0.5694580078125, 0.5962371826171875, 0.623016357421875, 0.6497955322265625, 0.67657470703125, 0.7033538818359375, 0.730133056640625, 0.7569122314453125, 0.78369140625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 3.0, 6.0, 5.0, 12.0, 15.0, 15.0, 18.0, 36.0, 45.0, 67.0, 83.0, 150.0, 210.0, 280.0, 439.0, 761.0, 1656.0, 4188.0, 14431.0, 66892.0, 545313.0, 335038.0, 58200.0, 13224.0, 3775.0, 1484.0, 742.0, 477.0, 320.0, 193.0, 126.0, 81.0, 83.0, 45.0, 44.0, 23.0, 19.0, 9.0, 12.0, 7.0, 1.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.076141357421875, -2.00189208984375, -1.927642822265625, -1.8533935546875, -1.779144287109375, -1.70489501953125, -1.630645751953125, -1.556396484375, -1.482147216796875, -1.40789794921875, -1.333648681640625, -1.2593994140625, -1.185150146484375, -1.11090087890625, -1.036651611328125, -0.96240234375, -0.888153076171875, -0.81390380859375, -0.739654541015625, -0.6654052734375, -0.591156005859375, -0.51690673828125, -0.442657470703125, -0.368408203125, -0.294158935546875, -0.21990966796875, -0.145660400390625, -0.0714111328125, 0.002838134765625, 0.07708740234375, 0.151336669921875, 0.2255859375, 0.299835205078125, 0.37408447265625, 0.448333740234375, 0.5225830078125, 0.596832275390625, 0.67108154296875, 0.745330810546875, 0.819580078125, 0.893829345703125, 0.96807861328125, 1.042327880859375, 1.1165771484375, 1.190826416015625, 1.26507568359375, 1.339324951171875, 1.41357421875, 1.487823486328125, 1.56207275390625, 1.636322021484375, 1.7105712890625, 1.784820556640625, 1.85906982421875, 1.933319091796875, 2.007568359375, 2.081817626953125, 2.15606689453125, 2.230316162109375, 2.3045654296875, 2.378814697265625, 2.45306396484375, 2.527313232421875, 2.6015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 12.0, 8.0, 12.0, 12.0, 12.0, 12.0, 26.0, 26.0, 34.0, 36.0, 42.0, 50.0, 60.0, 63.0, 56.0, 66.0, 54.0, 56.0, 54.0, 51.0, 37.0, 38.0, 29.0, 26.0, 31.0, 20.0, 8.0, 16.0, 10.0, 9.0, 7.0, 2.0, 7.0, 8.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.603515625, -3.481658935546875, -3.35980224609375, -3.237945556640625, -3.1160888671875, -2.994232177734375, -2.87237548828125, -2.750518798828125, -2.628662109375, -2.506805419921875, -2.38494873046875, -2.263092041015625, -2.1412353515625, -2.019378662109375, -1.89752197265625, -1.775665283203125, -1.65380859375, -1.531951904296875, -1.41009521484375, -1.288238525390625, -1.1663818359375, -1.044525146484375, -0.92266845703125, -0.800811767578125, -0.678955078125, -0.557098388671875, -0.43524169921875, -0.313385009765625, -0.1915283203125, -0.069671630859375, 0.05218505859375, 0.174041748046875, 0.2958984375, 0.417755126953125, 0.53961181640625, 0.661468505859375, 0.7833251953125, 0.905181884765625, 1.02703857421875, 1.148895263671875, 1.270751953125, 1.392608642578125, 1.51446533203125, 1.636322021484375, 1.7581787109375, 1.880035400390625, 2.00189208984375, 2.123748779296875, 2.24560546875, 2.367462158203125, 2.48931884765625, 2.611175537109375, 2.7330322265625, 2.854888916015625, 2.97674560546875, 3.098602294921875, 3.220458984375, 3.342315673828125, 3.46417236328125, 3.586029052734375, 3.7078857421875, 3.829742431640625, 3.95159912109375, 4.073455810546875, 4.1953125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 6.0, 5.0, 7.0, 10.0, 13.0, 17.0, 24.0, 36.0, 38.0, 82.0, 95.0, 163.0, 233.0, 402.0, 691.0, 1409.0, 2856.0, 6533.0, 16705.0, 47859.0, 171561.0, 615126.0, 123519.0, 37190.0, 13427.0, 5318.0, 2420.0, 1214.0, 622.0, 332.0, 209.0, 122.0, 107.0, 58.0, 45.0, 33.0, 19.0, 9.0, 9.0, 12.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.486328125, -0.47083282470703125, -0.4553375244140625, -0.43984222412109375, -0.424346923828125, -0.40885162353515625, -0.3933563232421875, -0.37786102294921875, -0.36236572265625, -0.34687042236328125, -0.3313751220703125, -0.31587982177734375, -0.300384521484375, -0.28488922119140625, -0.2693939208984375, -0.25389862060546875, -0.2384033203125, -0.22290802001953125, -0.2074127197265625, -0.19191741943359375, -0.176422119140625, -0.16092681884765625, -0.1454315185546875, -0.12993621826171875, -0.11444091796875, -0.09894561767578125, -0.0834503173828125, -0.06795501708984375, -0.052459716796875, -0.03696441650390625, -0.0214691162109375, -0.00597381591796875, 0.009521484375, 0.02501678466796875, 0.0405120849609375, 0.05600738525390625, 0.071502685546875, 0.08699798583984375, 0.1024932861328125, 0.11798858642578125, 0.13348388671875, 0.14897918701171875, 0.1644744873046875, 0.17996978759765625, 0.195465087890625, 0.21096038818359375, 0.2264556884765625, 0.24195098876953125, 0.2574462890625, 0.27294158935546875, 0.2884368896484375, 0.30393218994140625, 0.319427490234375, 0.33492279052734375, 0.3504180908203125, 0.36591339111328125, 0.38140869140625, 0.39690399169921875, 0.4123992919921875, 0.42789459228515625, 0.443389892578125, 0.45888519287109375, 0.4743804931640625, 0.48987579345703125, 0.50537109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 6.0, 8.0, 19.0, 15.0, 16.0, 12.0, 24.0, 31.0, 39.0, 41.0, 58.0, 90.0, 92.0, 97.0, 74.0, 73.0, 57.0, 47.0, 30.0, 29.0, 25.0, 24.0, 19.0, 7.0, 16.0, 7.0, 5.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.0001785755157470703, -0.00017306208610534668, -0.00016754865646362305, -0.00016203522682189941, -0.00015652179718017578, -0.00015100836753845215, -0.00014549493789672852, -0.00013998150825500488, -0.00013446807861328125, -0.00012895464897155762, -0.00012344121932983398, -0.00011792778968811035, -0.00011241436004638672, -0.00010690093040466309, -0.00010138750076293945, -9.587407112121582e-05, -9.036064147949219e-05, -8.484721183776855e-05, -7.933378219604492e-05, -7.382035255432129e-05, -6.830692291259766e-05, -6.279349327087402e-05, -5.728006362915039e-05, -5.176663398742676e-05, -4.6253204345703125e-05, -4.073977470397949e-05, -3.522634506225586e-05, -2.9712915420532227e-05, -2.4199485778808594e-05, -1.868605613708496e-05, -1.3172626495361328e-05, -7.659196853637695e-06, -2.1457672119140625e-06, 3.3676624298095703e-06, 8.881092071533203e-06, 1.4394521713256836e-05, 1.990795135498047e-05, 2.54213809967041e-05, 3.0934810638427734e-05, 3.644824028015137e-05, 4.1961669921875e-05, 4.747509956359863e-05, 5.2988529205322266e-05, 5.85019588470459e-05, 6.401538848876953e-05, 6.952881813049316e-05, 7.50422477722168e-05, 8.055567741394043e-05, 8.606910705566406e-05, 9.15825366973877e-05, 9.709596633911133e-05, 0.00010260939598083496, 0.0001081228256225586, 0.00011363625526428223, 0.00011914968490600586, 0.0001246631145477295, 0.00013017654418945312, 0.00013568997383117676, 0.0001412034034729004, 0.00014671683311462402, 0.00015223026275634766, 0.0001577436923980713, 0.00016325712203979492, 0.00016877055168151855, 0.0001742839813232422]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 7.0, 7.0, 4.0, 7.0, 5.0, 25.0, 23.0, 31.0, 67.0, 142.0, 211.0, 370.0, 728.0, 1661.0, 4783.0, 18186.0, 90932.0, 690608.0, 194396.0, 33553.0, 8075.0, 2640.0, 1021.0, 442.0, 242.0, 146.0, 77.0, 54.0, 31.0, 26.0, 11.0, 15.0, 12.0, 11.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.70263671875, -0.6804733276367188, -0.6583099365234375, -0.6361465454101562, -0.613983154296875, -0.5918197631835938, -0.5696563720703125, -0.5474929809570312, -0.52532958984375, -0.5031661987304688, -0.4810028076171875, -0.45883941650390625, -0.436676025390625, -0.41451263427734375, -0.3923492431640625, -0.37018585205078125, -0.3480224609375, -0.32585906982421875, -0.3036956787109375, -0.28153228759765625, -0.259368896484375, -0.23720550537109375, -0.2150421142578125, -0.19287872314453125, -0.17071533203125, -0.14855194091796875, -0.1263885498046875, -0.10422515869140625, -0.082061767578125, -0.05989837646484375, -0.0377349853515625, -0.01557159423828125, 0.006591796875, 0.02875518798828125, 0.0509185791015625, 0.07308197021484375, 0.095245361328125, 0.11740875244140625, 0.1395721435546875, 0.16173553466796875, 0.18389892578125, 0.20606231689453125, 0.2282257080078125, 0.25038909912109375, 0.272552490234375, 0.29471588134765625, 0.3168792724609375, 0.33904266357421875, 0.3612060546875, 0.38336944580078125, 0.4055328369140625, 0.42769622802734375, 0.449859619140625, 0.47202301025390625, 0.4941864013671875, 0.5163497924804688, 0.53851318359375, 0.5606765747070312, 0.5828399658203125, 0.6050033569335938, 0.627166748046875, 0.6493301391601562, 0.6714935302734375, 0.6936569213867188, 0.7158203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 10.0, 13.0, 14.0, 19.0, 26.0, 30.0, 48.0, 60.0, 86.0, 102.0, 110.0, 119.0, 96.0, 85.0, 46.0, 34.0, 38.0, 19.0, 10.0, 10.0, 14.0, 8.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62744140625, -0.5998458862304688, -0.5722503662109375, -0.5446548461914062, -0.517059326171875, -0.48946380615234375, -0.4618682861328125, -0.43427276611328125, -0.40667724609375, -0.37908172607421875, -0.3514862060546875, -0.32389068603515625, -0.296295166015625, -0.26869964599609375, -0.2411041259765625, -0.21350860595703125, -0.1859130859375, -0.15831756591796875, -0.1307220458984375, -0.10312652587890625, -0.075531005859375, -0.04793548583984375, -0.0203399658203125, 0.00725555419921875, 0.03485107421875, 0.06244659423828125, 0.0900421142578125, 0.11763763427734375, 0.145233154296875, 0.17282867431640625, 0.2004241943359375, 0.22801971435546875, 0.255615234375, 0.28321075439453125, 0.3108062744140625, 0.33840179443359375, 0.365997314453125, 0.39359283447265625, 0.4211883544921875, 0.44878387451171875, 0.47637939453125, 0.5039749145507812, 0.5315704345703125, 0.5591659545898438, 0.586761474609375, 0.6143569946289062, 0.6419525146484375, 0.6695480346679688, 0.6971435546875, 0.7247390747070312, 0.7523345947265625, 0.7799301147460938, 0.807525634765625, 0.8351211547851562, 0.8627166748046875, 0.8903121948242188, 0.91790771484375, 0.9455032348632812, 0.9730987548828125, 1.0006942749023438, 1.028289794921875, 1.0558853149414062, 1.0834808349609375, 1.1110763549804688, 1.138671875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 9.0, 13.0, 22.0, 50.0, 83.0, 179.0, 282.0, 127.0, 93.0, 50.0, 32.0, 27.0, 8.0, 8.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.155160903930664, -19.598899841308594, -19.04263687133789, -18.48637580871582, -17.930112838745117, -17.373851776123047, -16.817588806152344, -16.261327743530273, -15.70506477355957, -15.148802757263184, -14.592540740966797, -14.03627872467041, -13.480016708374023, -12.923754692077637, -12.36749267578125, -11.81123161315918, -11.254969596862793, -10.698707580566406, -10.14244556427002, -9.586183547973633, -9.029921531677246, -8.47365951538086, -7.917397975921631, -7.361135959625244, -6.804873943328857, -6.248611927032471, -5.692349910736084, -5.1360883712768555, -4.579826354980469, -4.023564338684082, -3.4673023223876953, -2.9110403060913086, -2.3547773361206055, -1.7985153198242188, -1.2422534227371216, -0.6859915256500244, -0.1297295093536377, 0.426532506942749, 0.9827942848205566, 1.5390563011169434, 2.09531831741333, 2.651580333709717, 3.2078423500061035, 3.764104127883911, 4.320365905761719, 4.8766279220581055, 5.432889938354492, 5.989151954650879, 6.545413970947266, 7.101675987243652, 7.657938003540039, 8.214200019836426, 8.770462036132812, 9.3267240524292, 9.882986068725586, 10.439247131347656, 10.99551010131836, 11.551772117614746, 12.108034133911133, 12.66429615020752, 13.220558166503906, 13.776820182800293, 14.33308219909668, 14.88934326171875, 15.445605278015137]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 6.0, 6.0, 8.0, 16.0, 12.0, 14.0, 21.0, 18.0, 30.0, 18.0, 17.0, 22.0, 27.0, 29.0, 41.0, 48.0, 67.0, 99.0, 77.0, 61.0, 42.0, 32.0, 37.0, 29.0, 22.0, 27.0, 20.0, 21.0, 23.0, 13.0, 17.0, 10.0, 10.0, 8.0, 4.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.744348526000977, -9.394092559814453, -9.04383659362793, -8.693581581115723, -8.3433256149292, -7.993069648742676, -7.642813682556152, -7.292558193206787, -6.942302703857422, -6.592046737670898, -6.241791248321533, -5.89153528213501, -5.5412797927856445, -5.191023826599121, -4.840767860412598, -4.490512371063232, -4.140256404876709, -3.7900006771087646, -3.4397449493408203, -3.089488983154297, -2.7392334938049316, -2.388977527618408, -2.038721799850464, -1.6884660720825195, -1.3382103443145752, -0.9879546165466309, -0.6376988291740417, -0.28744304180145264, 0.0628126859664917, 0.41306841373443604, 0.7633242607116699, 1.1135799884796143, 1.4638357162475586, 1.814091444015503, 2.1643471717834473, 2.5146031379699707, 2.864858627319336, 3.2151145935058594, 3.5653703212738037, 3.915626049041748, 4.265881538391113, 4.616137504577637, 4.966392993927002, 5.316648960113525, 5.666904449462891, 6.017160415649414, 6.3674163818359375, 6.717671871185303, 7.067927837371826, 7.41818380355835, 7.768439292907715, 8.118695259094238, 8.468951225280762, 8.819206237792969, 9.169462203979492, 9.519718170166016, 9.869974136352539, 10.220230102539062, 10.570486068725586, 10.920741081237793, 11.270997047424316, 11.62125301361084, 11.971508979797363, 12.32176399230957, 12.672019958496094]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 14.0, 20.0, 20.0, 33.0, 51.0, 58.0, 93.0, 152.0, 254.0, 444.0, 760.0, 1389.0, 2724.0, 5713.0, 13580.0, 35936.0, 102796.0, 307497.0, 858521.0, 1485965.0, 888150.0, 319250.0, 106308.0, 38067.0, 14350.0, 5950.0, 2789.0, 1415.0, 796.0, 439.0, 230.0, 156.0, 111.0, 75.0, 59.0, 36.0, 16.0, 9.0, 18.0, 11.0, 2.0, 3.0, 4.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65380859375, -0.63238525390625, -0.6109619140625, -0.58953857421875, -0.568115234375, -0.54669189453125, -0.5252685546875, -0.50384521484375, -0.482421875, -0.46099853515625, -0.4395751953125, -0.41815185546875, -0.396728515625, -0.37530517578125, -0.3538818359375, -0.33245849609375, -0.31103515625, -0.28961181640625, -0.2681884765625, -0.24676513671875, -0.225341796875, -0.20391845703125, -0.1824951171875, -0.16107177734375, -0.1396484375, -0.11822509765625, -0.0968017578125, -0.07537841796875, -0.053955078125, -0.03253173828125, -0.0111083984375, 0.01031494140625, 0.03173828125, 0.05316162109375, 0.0745849609375, 0.09600830078125, 0.117431640625, 0.13885498046875, 0.1602783203125, 0.18170166015625, 0.203125, 0.22454833984375, 0.2459716796875, 0.26739501953125, 0.288818359375, 0.31024169921875, 0.3316650390625, 0.35308837890625, 0.37451171875, 0.39593505859375, 0.4173583984375, 0.43878173828125, 0.460205078125, 0.48162841796875, 0.5030517578125, 0.52447509765625, 0.5458984375, 0.56732177734375, 0.5887451171875, 0.61016845703125, 0.631591796875, 0.65301513671875, 0.6744384765625, 0.69586181640625, 0.71728515625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 7.0, 6.0, 3.0, 14.0, 11.0, 9.0, 15.0, 17.0, 25.0, 23.0, 26.0, 36.0, 34.0, 40.0, 43.0, 39.0, 58.0, 53.0, 35.0, 58.0, 43.0, 49.0, 46.0, 46.0, 40.0, 36.0, 30.0, 30.0, 23.0, 24.0, 17.0, 7.0, 14.0, 11.0, 7.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0263671875, -0.996856689453125, -0.96734619140625, -0.937835693359375, -0.9083251953125, -0.878814697265625, -0.84930419921875, -0.819793701171875, -0.790283203125, -0.760772705078125, -0.73126220703125, -0.701751708984375, -0.6722412109375, -0.642730712890625, -0.61322021484375, -0.583709716796875, -0.55419921875, -0.524688720703125, -0.49517822265625, -0.465667724609375, -0.4361572265625, -0.406646728515625, -0.37713623046875, -0.347625732421875, -0.318115234375, -0.288604736328125, -0.25909423828125, -0.229583740234375, -0.2000732421875, -0.170562744140625, -0.14105224609375, -0.111541748046875, -0.08203125, -0.052520751953125, -0.02301025390625, 0.006500244140625, 0.0360107421875, 0.065521240234375, 0.09503173828125, 0.124542236328125, 0.154052734375, 0.183563232421875, 0.21307373046875, 0.242584228515625, 0.2720947265625, 0.301605224609375, 0.33111572265625, 0.360626220703125, 0.39013671875, 0.419647216796875, 0.44915771484375, 0.478668212890625, 0.5081787109375, 0.537689208984375, 0.56719970703125, 0.596710205078125, 0.626220703125, 0.655731201171875, 0.68524169921875, 0.714752197265625, 0.7442626953125, 0.773773193359375, 0.80328369140625, 0.832794189453125, 0.8623046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 4.0, 11.0, 11.0, 14.0, 19.0, 31.0, 52.0, 73.0, 136.0, 258.0, 653.0, 2227.0, 12227.0, 174795.0, 3723573.0, 261202.0, 14999.0, 2711.0, 671.0, 273.0, 127.0, 58.0, 46.0, 28.0, 22.0, 12.0, 11.0, 5.0, 9.0, 5.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.556640625, -2.46710205078125, -2.3775634765625, -2.28802490234375, -2.198486328125, -2.10894775390625, -2.0194091796875, -1.92987060546875, -1.84033203125, -1.75079345703125, -1.6612548828125, -1.57171630859375, -1.482177734375, -1.39263916015625, -1.3031005859375, -1.21356201171875, -1.1240234375, -1.03448486328125, -0.9449462890625, -0.85540771484375, -0.765869140625, -0.67633056640625, -0.5867919921875, -0.49725341796875, -0.40771484375, -0.31817626953125, -0.2286376953125, -0.13909912109375, -0.049560546875, 0.03997802734375, 0.1295166015625, 0.21905517578125, 0.30859375, 0.39813232421875, 0.4876708984375, 0.57720947265625, 0.666748046875, 0.75628662109375, 0.8458251953125, 0.93536376953125, 1.02490234375, 1.11444091796875, 1.2039794921875, 1.29351806640625, 1.383056640625, 1.47259521484375, 1.5621337890625, 1.65167236328125, 1.7412109375, 1.83074951171875, 1.9202880859375, 2.00982666015625, 2.099365234375, 2.18890380859375, 2.2784423828125, 2.36798095703125, 2.45751953125, 2.54705810546875, 2.6365966796875, 2.72613525390625, 2.815673828125, 2.90521240234375, 2.9947509765625, 3.08428955078125, 3.173828125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 5.0, 5.0, 9.0, 4.0, 17.0, 26.0, 42.0, 48.0, 67.0, 100.0, 165.0, 243.0, 353.0, 453.0, 574.0, 570.0, 434.0, 318.0, 217.0, 125.0, 92.0, 61.0, 41.0, 32.0, 17.0, 8.0, 10.0, 9.0, 6.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.171875, -2.109588623046875, -2.04730224609375, -1.985015869140625, -1.9227294921875, -1.860443115234375, -1.79815673828125, -1.735870361328125, -1.673583984375, -1.611297607421875, -1.54901123046875, -1.486724853515625, -1.4244384765625, -1.362152099609375, -1.29986572265625, -1.237579345703125, -1.17529296875, -1.113006591796875, -1.05072021484375, -0.988433837890625, -0.9261474609375, -0.863861083984375, -0.80157470703125, -0.739288330078125, -0.677001953125, -0.614715576171875, -0.55242919921875, -0.490142822265625, -0.4278564453125, -0.365570068359375, -0.30328369140625, -0.240997314453125, -0.1787109375, -0.116424560546875, -0.05413818359375, 0.008148193359375, 0.0704345703125, 0.132720947265625, 0.19500732421875, 0.257293701171875, 0.319580078125, 0.381866455078125, 0.44415283203125, 0.506439208984375, 0.5687255859375, 0.631011962890625, 0.69329833984375, 0.755584716796875, 0.81787109375, 0.880157470703125, 0.94244384765625, 1.004730224609375, 1.0670166015625, 1.129302978515625, 1.19158935546875, 1.253875732421875, 1.316162109375, 1.378448486328125, 1.44073486328125, 1.503021240234375, 1.5653076171875, 1.627593994140625, 1.68988037109375, 1.752166748046875, 1.814453125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 11.0, 18.0, 34.0, 137.0, 300.0, 331.0, 119.0, 37.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.78962326049805, -55.70196533203125, -54.61430358886719, -53.52664566040039, -52.438987731933594, -51.35132598876953, -50.263668060302734, -49.17600631713867, -48.088348388671875, -47.00069046020508, -45.913028717041016, -44.82537078857422, -43.737709045410156, -42.65005111694336, -41.56239318847656, -40.4747314453125, -39.3870735168457, -38.299415588378906, -37.211753845214844, -36.12409591674805, -35.03643798828125, -33.94877624511719, -32.86111831665039, -31.77345848083496, -30.68579864501953, -29.5981388092041, -28.510478973388672, -27.422821044921875, -26.335161209106445, -25.247501373291016, -24.15984344482422, -23.07218360900879, -21.984525680541992, -20.896865844726562, -19.809207916259766, -18.721548080444336, -17.633888244628906, -16.546228408813477, -15.458569526672363, -14.37091064453125, -13.28325080871582, -12.19559097290039, -11.107932090759277, -10.020273208618164, -8.932613372802734, -7.844954013824463, -6.757294654846191, -5.66963529586792, -4.581975936889648, -3.494316577911377, -2.4066572189331055, -1.318997859954834, -0.2313385009765625, 0.856320858001709, 1.9439802169799805, 3.031639575958252, 4.119298934936523, 5.206958293914795, 6.294617652893066, 7.382277011871338, 8.46993637084961, 9.557596206665039, 10.645255088806152, 11.732913970947266, 12.820573806762695]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 10.0, 4.0, 12.0, 11.0, 10.0, 12.0, 20.0, 27.0, 29.0, 29.0, 43.0, 36.0, 55.0, 48.0, 52.0, 54.0, 47.0, 60.0, 54.0, 49.0, 70.0, 32.0, 42.0, 28.0, 32.0, 23.0, 17.0, 20.0, 13.0, 15.0, 16.0, 11.0, 7.0, 3.0, 0.0, 7.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.378660202026367, -10.024774551391602, -9.670888900756836, -9.31700325012207, -8.963116645812988, -8.609230995178223, -8.255345344543457, -7.901459693908691, -7.547573566436768, -7.193687915802002, -6.839801788330078, -6.4859161376953125, -6.132030487060547, -5.778144359588623, -5.424258708953857, -5.070372581481934, -4.716486930847168, -4.362601280212402, -4.0087151527404785, -3.654829502105713, -3.300943613052368, -2.9470577239990234, -2.593172073364258, -2.239286184310913, -1.8854002952575684, -1.5315144062042236, -1.1776286363601685, -0.8237428665161133, -0.46985697746276855, -0.11597108840942383, 0.2379145622253418, 0.5918004512786865, 0.9456863403320312, 1.299572229385376, 1.6534579992294312, 2.0073437690734863, 2.361229658126831, 2.715115547180176, 3.0690011978149414, 3.422887086868286, 3.776772975921631, 4.1306586265563965, 4.48454475402832, 4.838430404663086, 5.192316055297852, 5.546202182769775, 5.900087833404541, 6.253973960876465, 6.6078596115112305, 6.961745262145996, 7.31563138961792, 7.6695170402526855, 8.02340316772461, 8.377288818359375, 8.73117446899414, 9.085060119628906, 9.438945770263672, 9.792831420898438, 10.146717071533203, 10.500602722167969, 10.85448932647705, 11.208374977111816, 11.562260627746582, 11.916146278381348, 12.27003288269043]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 4.0, 1.0, 5.0, 10.0, 6.0, 12.0, 17.0, 25.0, 35.0, 48.0, 76.0, 96.0, 151.0, 209.0, 339.0, 429.0, 710.0, 1102.0, 1688.0, 2668.0, 4409.0, 7014.0, 12074.0, 21315.0, 39490.0, 76186.0, 148980.0, 251264.0, 223334.0, 120259.0, 60737.0, 32016.0, 17479.0, 10014.0, 5943.0, 3692.0, 2356.0, 1477.0, 950.0, 663.0, 391.0, 301.0, 165.0, 133.0, 81.0, 67.0, 43.0, 28.0, 19.0, 20.0, 9.0, 6.0, 9.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0384368896484375, -1.003631591796875, -0.9688262939453125, -0.93402099609375, -0.8992156982421875, -0.864410400390625, -0.8296051025390625, -0.7947998046875, -0.7599945068359375, -0.725189208984375, -0.6903839111328125, -0.65557861328125, -0.6207733154296875, -0.585968017578125, -0.5511627197265625, -0.516357421875, -0.4815521240234375, -0.446746826171875, -0.4119415283203125, -0.37713623046875, -0.3423309326171875, -0.307525634765625, -0.2727203369140625, -0.2379150390625, -0.2031097412109375, -0.168304443359375, -0.1334991455078125, -0.09869384765625, -0.0638885498046875, -0.029083251953125, 0.0057220458984375, 0.04052734375, 0.0753326416015625, 0.110137939453125, 0.1449432373046875, 0.17974853515625, 0.2145538330078125, 0.249359130859375, 0.2841644287109375, 0.3189697265625, 0.3537750244140625, 0.388580322265625, 0.4233856201171875, 0.45819091796875, 0.4929962158203125, 0.527801513671875, 0.5626068115234375, 0.597412109375, 0.6322174072265625, 0.667022705078125, 0.7018280029296875, 0.73663330078125, 0.7714385986328125, 0.806243896484375, 0.8410491943359375, 0.8758544921875, 0.9106597900390625, 0.945465087890625, 0.9802703857421875, 1.01507568359375, 1.0498809814453125, 1.084686279296875, 1.1194915771484375, 1.154296875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 5.0, 9.0, 9.0, 8.0, 12.0, 19.0, 29.0, 25.0, 29.0, 29.0, 33.0, 33.0, 32.0, 32.0, 50.0, 54.0, 55.0, 41.0, 45.0, 44.0, 38.0, 43.0, 26.0, 35.0, 42.0, 31.0, 32.0, 22.0, 24.0, 16.0, 22.0, 15.0, 8.0, 9.0, 6.0, 11.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.93798828125, -0.9094009399414062, -0.8808135986328125, -0.8522262573242188, -0.823638916015625, -0.7950515747070312, -0.7664642333984375, -0.7378768920898438, -0.70928955078125, -0.6807022094726562, -0.6521148681640625, -0.6235275268554688, -0.594940185546875, -0.5663528442382812, -0.5377655029296875, -0.5091781616210938, -0.4805908203125, -0.45200347900390625, -0.4234161376953125, -0.39482879638671875, -0.366241455078125, -0.33765411376953125, -0.3090667724609375, -0.28047943115234375, -0.25189208984375, -0.22330474853515625, -0.1947174072265625, -0.16613006591796875, -0.137542724609375, -0.10895538330078125, -0.0803680419921875, -0.05178070068359375, -0.023193359375, 0.00539398193359375, 0.0339813232421875, 0.06256866455078125, 0.091156005859375, 0.11974334716796875, 0.1483306884765625, 0.17691802978515625, 0.20550537109375, 0.23409271240234375, 0.2626800537109375, 0.29126739501953125, 0.319854736328125, 0.34844207763671875, 0.3770294189453125, 0.40561676025390625, 0.4342041015625, 0.46279144287109375, 0.4913787841796875, 0.5199661254882812, 0.548553466796875, 0.5771408081054688, 0.6057281494140625, 0.6343154907226562, 0.66290283203125, 0.6914901733398438, 0.7200775146484375, 0.7486648559570312, 0.777252197265625, 0.8058395385742188, 0.8344268798828125, 0.8630142211914062, 0.8916015625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 10.0, 9.0, 11.0, 12.0, 26.0, 24.0, 39.0, 48.0, 63.0, 64.0, 128.0, 196.0, 253.0, 405.0, 630.0, 1016.0, 2240.0, 6583.0, 31354.0, 249152.0, 685188.0, 54852.0, 9734.0, 3021.0, 1337.0, 739.0, 442.0, 309.0, 191.0, 132.0, 88.0, 85.0, 51.0, 29.0, 29.0, 19.0, 10.0, 11.0, 9.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.021484375, -2.930328369140625, -2.83917236328125, -2.748016357421875, -2.6568603515625, -2.565704345703125, -2.47454833984375, -2.383392333984375, -2.292236328125, -2.201080322265625, -2.10992431640625, -2.018768310546875, -1.9276123046875, -1.836456298828125, -1.74530029296875, -1.654144287109375, -1.56298828125, -1.471832275390625, -1.38067626953125, -1.289520263671875, -1.1983642578125, -1.107208251953125, -1.01605224609375, -0.924896240234375, -0.833740234375, -0.742584228515625, -0.65142822265625, -0.560272216796875, -0.4691162109375, -0.377960205078125, -0.28680419921875, -0.195648193359375, -0.1044921875, -0.013336181640625, 0.07781982421875, 0.168975830078125, 0.2601318359375, 0.351287841796875, 0.44244384765625, 0.533599853515625, 0.624755859375, 0.715911865234375, 0.80706787109375, 0.898223876953125, 0.9893798828125, 1.080535888671875, 1.17169189453125, 1.262847900390625, 1.35400390625, 1.445159912109375, 1.53631591796875, 1.627471923828125, 1.7186279296875, 1.809783935546875, 1.90093994140625, 1.992095947265625, 2.083251953125, 2.174407958984375, 2.26556396484375, 2.356719970703125, 2.4478759765625, 2.539031982421875, 2.63018798828125, 2.721343994140625, 2.8125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 10.0, 7.0, 7.0, 11.0, 13.0, 14.0, 15.0, 28.0, 27.0, 29.0, 36.0, 37.0, 67.0, 45.0, 68.0, 63.0, 49.0, 70.0, 53.0, 59.0, 61.0, 42.0, 27.0, 31.0, 20.0, 22.0, 16.0, 15.0, 8.0, 5.0, 7.0, 6.0, 8.0, 2.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.333099365234375, -3.21502685546875, -3.096954345703125, -2.9788818359375, -2.860809326171875, -2.74273681640625, -2.624664306640625, -2.506591796875, -2.388519287109375, -2.27044677734375, -2.152374267578125, -2.0343017578125, -1.916229248046875, -1.79815673828125, -1.680084228515625, -1.56201171875, -1.443939208984375, -1.32586669921875, -1.207794189453125, -1.0897216796875, -0.971649169921875, -0.85357666015625, -0.735504150390625, -0.617431640625, -0.499359130859375, -0.38128662109375, -0.263214111328125, -0.1451416015625, -0.027069091796875, 0.09100341796875, 0.209075927734375, 0.3271484375, 0.445220947265625, 0.56329345703125, 0.681365966796875, 0.7994384765625, 0.917510986328125, 1.03558349609375, 1.153656005859375, 1.271728515625, 1.389801025390625, 1.50787353515625, 1.625946044921875, 1.7440185546875, 1.862091064453125, 1.98016357421875, 2.098236083984375, 2.21630859375, 2.334381103515625, 2.45245361328125, 2.570526123046875, 2.6885986328125, 2.806671142578125, 2.92474365234375, 3.042816162109375, 3.160888671875, 3.278961181640625, 3.39703369140625, 3.515106201171875, 3.6331787109375, 3.751251220703125, 3.86932373046875, 3.987396240234375, 4.10546875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 9.0, 5.0, 12.0, 16.0, 19.0, 33.0, 48.0, 80.0, 135.0, 174.0, 327.0, 675.0, 1383.0, 3707.0, 12704.0, 58030.0, 630887.0, 278823.0, 45206.0, 10461.0, 3186.0, 1213.0, 584.0, 312.0, 175.0, 121.0, 77.0, 41.0, 41.0, 18.0, 18.0, 11.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62939453125, -0.60968017578125, -0.5899658203125, -0.57025146484375, -0.550537109375, -0.53082275390625, -0.5111083984375, -0.49139404296875, -0.4716796875, -0.45196533203125, -0.4322509765625, -0.41253662109375, -0.392822265625, -0.37310791015625, -0.3533935546875, -0.33367919921875, -0.31396484375, -0.29425048828125, -0.2745361328125, -0.25482177734375, -0.235107421875, -0.21539306640625, -0.1956787109375, -0.17596435546875, -0.15625, -0.13653564453125, -0.1168212890625, -0.09710693359375, -0.077392578125, -0.05767822265625, -0.0379638671875, -0.01824951171875, 0.00146484375, 0.02117919921875, 0.0408935546875, 0.06060791015625, 0.080322265625, 0.10003662109375, 0.1197509765625, 0.13946533203125, 0.1591796875, 0.17889404296875, 0.1986083984375, 0.21832275390625, 0.238037109375, 0.25775146484375, 0.2774658203125, 0.29718017578125, 0.31689453125, 0.33660888671875, 0.3563232421875, 0.37603759765625, 0.395751953125, 0.41546630859375, 0.4351806640625, 0.45489501953125, 0.474609375, 0.49432373046875, 0.5140380859375, 0.53375244140625, 0.553466796875, 0.57318115234375, 0.5928955078125, 0.61260986328125, 0.63232421875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 8.0, 13.0, 20.0, 17.0, 16.0, 34.0, 27.0, 56.0, 73.0, 120.0, 149.0, 110.0, 100.0, 67.0, 43.0, 38.0, 23.0, 17.0, 11.0, 13.0, 12.0, 8.0, 3.0, 3.0, 6.0, 5.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002951622009277344, -0.00028666481375694275, -0.0002781674265861511, -0.0002696700394153595, -0.00026117265224456787, -0.00025267526507377625, -0.0002441778779029846, -0.000235680490732193, -0.00022718310356140137, -0.00021868571639060974, -0.00021018832921981812, -0.0002016909420490265, -0.00019319355487823486, -0.00018469616770744324, -0.0001761987805366516, -0.00016770139336585999, -0.00015920400619506836, -0.00015070661902427673, -0.0001422092318534851, -0.00013371184468269348, -0.00012521445751190186, -0.00011671707034111023, -0.0001082196831703186, -9.972229599952698e-05, -9.122490882873535e-05, -8.272752165794373e-05, -7.42301344871521e-05, -6.573274731636047e-05, -5.723536014556885e-05, -4.873797297477722e-05, -4.0240585803985596e-05, -3.174319863319397e-05, -2.3245811462402344e-05, -1.4748424291610718e-05, -6.251037120819092e-06, 2.246350049972534e-06, 1.074373722076416e-05, 1.9241124391555786e-05, 2.7738511562347412e-05, 3.623589873313904e-05, 4.4733285903930664e-05, 5.323067307472229e-05, 6.172806024551392e-05, 7.022544741630554e-05, 7.872283458709717e-05, 8.72202217578888e-05, 9.571760892868042e-05, 0.00010421499609947205, 0.00011271238327026367, 0.0001212097704410553, 0.00012970715761184692, 0.00013820454478263855, 0.00014670193195343018, 0.0001551993191242218, 0.00016369670629501343, 0.00017219409346580505, 0.00018069148063659668, 0.0001891888678073883, 0.00019768625497817993, 0.00020618364214897156, 0.00021468102931976318, 0.0002231784164905548, 0.00023167580366134644, 0.00024017319083213806, 0.0002486705780029297]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 6.0, 12.0, 31.0, 37.0, 78.0, 142.0, 321.0, 743.0, 2207.0, 11218.0, 162717.0, 824099.0, 40001.0, 4629.0, 1319.0, 505.0, 214.0, 115.0, 64.0, 31.0, 22.0, 11.0, 9.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0380859375, -1.0068740844726562, -0.9756622314453125, -0.9444503784179688, -0.913238525390625, -0.8820266723632812, -0.8508148193359375, -0.8196029663085938, -0.78839111328125, -0.7571792602539062, -0.7259674072265625, -0.6947555541992188, -0.663543701171875, -0.6323318481445312, -0.6011199951171875, -0.5699081420898438, -0.5386962890625, -0.5074844360351562, -0.4762725830078125, -0.44506072998046875, -0.413848876953125, -0.38263702392578125, -0.3514251708984375, -0.32021331787109375, -0.28900146484375, -0.25778961181640625, -0.2265777587890625, -0.19536590576171875, -0.164154052734375, -0.13294219970703125, -0.1017303466796875, -0.07051849365234375, -0.039306640625, -0.00809478759765625, 0.0231170654296875, 0.05432891845703125, 0.085540771484375, 0.11675262451171875, 0.1479644775390625, 0.17917633056640625, 0.21038818359375, 0.24160003662109375, 0.2728118896484375, 0.30402374267578125, 0.335235595703125, 0.36644744873046875, 0.3976593017578125, 0.42887115478515625, 0.4600830078125, 0.49129486083984375, 0.5225067138671875, 0.5537185668945312, 0.584930419921875, 0.6161422729492188, 0.6473541259765625, 0.6785659790039062, 0.70977783203125, 0.7409896850585938, 0.7722015380859375, 0.8034133911132812, 0.834625244140625, 0.8658370971679688, 0.8970489501953125, 0.9282608032226562, 0.95947265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 3.0, 14.0, 11.0, 13.0, 16.0, 20.0, 22.0, 26.0, 55.0, 76.0, 66.0, 117.0, 121.0, 114.0, 93.0, 58.0, 37.0, 30.0, 33.0, 22.0, 11.0, 14.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.724609375, -0.7015380859375, -0.678466796875, -0.6553955078125, -0.63232421875, -0.6092529296875, -0.586181640625, -0.5631103515625, -0.5400390625, -0.5169677734375, -0.493896484375, -0.4708251953125, -0.44775390625, -0.4246826171875, -0.401611328125, -0.3785400390625, -0.35546875, -0.3323974609375, -0.309326171875, -0.2862548828125, -0.26318359375, -0.2401123046875, -0.217041015625, -0.1939697265625, -0.1708984375, -0.1478271484375, -0.124755859375, -0.1016845703125, -0.07861328125, -0.0555419921875, -0.032470703125, -0.0093994140625, 0.013671875, 0.0367431640625, 0.059814453125, 0.0828857421875, 0.10595703125, 0.1290283203125, 0.152099609375, 0.1751708984375, 0.1982421875, 0.2213134765625, 0.244384765625, 0.2674560546875, 0.29052734375, 0.3135986328125, 0.336669921875, 0.3597412109375, 0.3828125, 0.4058837890625, 0.428955078125, 0.4520263671875, 0.47509765625, 0.4981689453125, 0.521240234375, 0.5443115234375, 0.5673828125, 0.5904541015625, 0.613525390625, 0.6365966796875, 0.65966796875, 0.6827392578125, 0.705810546875, 0.7288818359375, 0.751953125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 16.0, 13.0, 36.0, 90.0, 145.0, 390.0, 145.0, 82.0, 35.0, 20.0, 14.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.571950912475586, -24.851276397705078, -24.13060188293457, -23.409927368164062, -22.689252853393555, -21.968578338623047, -21.24790382385254, -20.52722930908203, -19.806554794311523, -19.085880279541016, -18.365205764770508, -17.64453125, -16.923856735229492, -16.203182220458984, -15.482507705688477, -14.761833190917969, -14.041158676147461, -13.320484161376953, -12.599809646606445, -11.879135131835938, -11.15846061706543, -10.437786102294922, -9.717111587524414, -8.996437072753906, -8.275762557983398, -7.555088043212891, -6.834413528442383, -6.113739013671875, -5.393064498901367, -4.672389984130859, -3.9517154693603516, -3.2310409545898438, -2.510364532470703, -1.7896900177001953, -1.0690155029296875, -0.3483409881591797, 0.3723335266113281, 1.093008041381836, 1.8136825561523438, 2.5343570709228516, 3.2550315856933594, 3.975706100463867, 4.696380615234375, 5.417055130004883, 6.137729644775391, 6.858404159545898, 7.579078674316406, 8.299753189086914, 9.020427703857422, 9.74110221862793, 10.461776733398438, 11.182451248168945, 11.903125762939453, 12.623800277709961, 13.344474792480469, 14.065149307250977, 14.785823822021484, 15.506498336791992, 16.2271728515625, 16.947847366333008, 17.668521881103516, 18.389196395874023, 19.10987091064453, 19.83054542541504, 20.551219940185547]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 3.0, 7.0, 11.0, 7.0, 8.0, 4.0, 8.0, 13.0, 18.0, 20.0, 29.0, 33.0, 24.0, 22.0, 28.0, 31.0, 41.0, 97.0, 159.0, 85.0, 48.0, 37.0, 33.0, 33.0, 38.0, 21.0, 21.0, 18.0, 7.0, 20.0, 10.0, 13.0, 11.0, 5.0, 11.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.804824829101562, -14.386870384216309, -13.968915939331055, -13.5509614944458, -13.133007049560547, -12.715051651000977, -12.297097206115723, -11.879142761230469, -11.461188316345215, -11.043233871459961, -10.625279426574707, -10.207324981689453, -9.789369583129883, -9.371416091918945, -8.953460693359375, -8.535506248474121, -8.117551803588867, -7.699597358703613, -7.281642913818359, -6.863687992095947, -6.445733547210693, -6.0277791023254395, -5.609824180603027, -5.191869735717773, -4.7739152908325195, -4.355960845947266, -3.9380061626434326, -3.5200514793395996, -3.1020970344543457, -2.684142589569092, -2.266187906265259, -1.8482332229614258, -1.4302787780761719, -1.0123242139816284, -0.594369649887085, -0.1764150857925415, 0.24153947830200195, 0.6594939231872559, 1.0774486064910889, 1.4954032897949219, 1.9133577346801758, 2.3313121795654297, 2.7492668628692627, 3.1672215461730957, 3.5851759910583496, 4.0031304359436035, 4.421085357666016, 4.8390398025512695, 5.256994247436523, 5.674948692321777, 6.092903137207031, 6.510858058929443, 6.928812503814697, 7.346766948699951, 7.764721870422363, 8.182676315307617, 8.600630760192871, 9.018585205078125, 9.436539649963379, 9.854494094848633, 10.272449493408203, 10.69040298461914, 11.108358383178711, 11.526312828063965, 11.944267272949219]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 11.0, 15.0, 25.0, 37.0, 46.0, 57.0, 119.0, 169.0, 216.0, 294.0, 485.0, 744.0, 1196.0, 1882.0, 3250.0, 6333.0, 13605.0, 34103.0, 100166.0, 312023.0, 813019.0, 1400626.0, 928624.0, 376205.0, 125352.0, 42614.0, 16124.0, 7309.0, 3723.0, 2126.0, 1245.0, 824.0, 522.0, 364.0, 256.0, 181.0, 121.0, 77.0, 69.0, 43.0, 19.0, 23.0, 8.0, 12.0, 1.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.927734375, -0.8992691040039062, -0.8708038330078125, -0.8423385620117188, -0.813873291015625, -0.7854080200195312, -0.7569427490234375, -0.7284774780273438, -0.70001220703125, -0.6715469360351562, -0.6430816650390625, -0.6146163940429688, -0.586151123046875, -0.5576858520507812, -0.5292205810546875, -0.5007553100585938, -0.4722900390625, -0.44382476806640625, -0.4153594970703125, -0.38689422607421875, -0.358428955078125, -0.32996368408203125, -0.3014984130859375, -0.27303314208984375, -0.24456787109375, -0.21610260009765625, -0.1876373291015625, -0.15917205810546875, -0.130706787109375, -0.10224151611328125, -0.0737762451171875, -0.04531097412109375, -0.016845703125, 0.01161956787109375, 0.0400848388671875, 0.06855010986328125, 0.097015380859375, 0.12548065185546875, 0.1539459228515625, 0.18241119384765625, 0.21087646484375, 0.23934173583984375, 0.2678070068359375, 0.29627227783203125, 0.324737548828125, 0.35320281982421875, 0.3816680908203125, 0.41013336181640625, 0.4385986328125, 0.46706390380859375, 0.4955291748046875, 0.5239944458007812, 0.552459716796875, 0.5809249877929688, 0.6093902587890625, 0.6378555297851562, 0.66632080078125, 0.6947860717773438, 0.7232513427734375, 0.7517166137695312, 0.780181884765625, 0.8086471557617188, 0.8371124267578125, 0.8655776977539062, 0.89404296875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 11.0, 10.0, 7.0, 7.0, 12.0, 16.0, 21.0, 21.0, 27.0, 26.0, 30.0, 20.0, 33.0, 26.0, 42.0, 51.0, 38.0, 43.0, 48.0, 38.0, 53.0, 43.0, 41.0, 43.0, 36.0, 32.0, 28.0, 29.0, 17.0, 28.0, 22.0, 17.0, 21.0, 12.0, 13.0, 6.0, 10.0, 6.0, 5.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.9287109375, -0.9028244018554688, -0.8769378662109375, -0.8510513305664062, -0.825164794921875, -0.7992782592773438, -0.7733917236328125, -0.7475051879882812, -0.72161865234375, -0.6957321166992188, -0.6698455810546875, -0.6439590454101562, -0.618072509765625, -0.5921859741210938, -0.5662994384765625, -0.5404129028320312, -0.5145263671875, -0.48863983154296875, -0.4627532958984375, -0.43686676025390625, -0.410980224609375, -0.38509368896484375, -0.3592071533203125, -0.33332061767578125, -0.30743408203125, -0.28154754638671875, -0.2556610107421875, -0.22977447509765625, -0.203887939453125, -0.17800140380859375, -0.1521148681640625, -0.12622833251953125, -0.100341796875, -0.07445526123046875, -0.0485687255859375, -0.02268218994140625, 0.003204345703125, 0.02909088134765625, 0.0549774169921875, 0.08086395263671875, 0.10675048828125, 0.13263702392578125, 0.1585235595703125, 0.18441009521484375, 0.210296630859375, 0.23618316650390625, 0.2620697021484375, 0.28795623779296875, 0.3138427734375, 0.33972930908203125, 0.3656158447265625, 0.39150238037109375, 0.417388916015625, 0.44327545166015625, 0.4691619873046875, 0.49504852294921875, 0.52093505859375, 0.5468215942382812, 0.5727081298828125, 0.5985946655273438, 0.624481201171875, 0.6503677368164062, 0.6762542724609375, 0.7021408081054688, 0.72802734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 8.0, 18.0, 20.0, 39.0, 78.0, 154.0, 255.0, 531.0, 1283.0, 3634.0, 34863.0, 3941238.0, 202220.0, 6925.0, 1626.0, 717.0, 296.0, 151.0, 83.0, 57.0, 31.0, 12.0, 10.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.04296875, -5.86358642578125, -5.6842041015625, -5.50482177734375, -5.325439453125, -5.14605712890625, -4.9666748046875, -4.78729248046875, -4.60791015625, -4.42852783203125, -4.2491455078125, -4.06976318359375, -3.890380859375, -3.71099853515625, -3.5316162109375, -3.35223388671875, -3.1728515625, -2.99346923828125, -2.8140869140625, -2.63470458984375, -2.455322265625, -2.27593994140625, -2.0965576171875, -1.91717529296875, -1.73779296875, -1.55841064453125, -1.3790283203125, -1.19964599609375, -1.020263671875, -0.84088134765625, -0.6614990234375, -0.48211669921875, -0.302734375, -0.12335205078125, 0.0560302734375, 0.23541259765625, 0.414794921875, 0.59417724609375, 0.7735595703125, 0.95294189453125, 1.13232421875, 1.31170654296875, 1.4910888671875, 1.67047119140625, 1.849853515625, 2.02923583984375, 2.2086181640625, 2.38800048828125, 2.5673828125, 2.74676513671875, 2.9261474609375, 3.10552978515625, 3.284912109375, 3.46429443359375, 3.6436767578125, 3.82305908203125, 4.00244140625, 4.18182373046875, 4.3612060546875, 4.54058837890625, 4.719970703125, 4.89935302734375, 5.0787353515625, 5.25811767578125, 5.4375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 11.0, 21.0, 33.0, 57.0, 75.0, 155.0, 197.0, 373.0, 627.0, 787.0, 638.0, 380.0, 312.0, 149.0, 103.0, 61.0, 37.0, 20.0, 14.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.736328125, -3.613983154296875, -3.49163818359375, -3.369293212890625, -3.2469482421875, -3.124603271484375, -3.00225830078125, -2.879913330078125, -2.757568359375, -2.635223388671875, -2.51287841796875, -2.390533447265625, -2.2681884765625, -2.145843505859375, -2.02349853515625, -1.901153564453125, -1.77880859375, -1.656463623046875, -1.53411865234375, -1.411773681640625, -1.2894287109375, -1.167083740234375, -1.04473876953125, -0.922393798828125, -0.800048828125, -0.677703857421875, -0.55535888671875, -0.433013916015625, -0.3106689453125, -0.188323974609375, -0.06597900390625, 0.056365966796875, 0.1787109375, 0.301055908203125, 0.42340087890625, 0.545745849609375, 0.6680908203125, 0.790435791015625, 0.91278076171875, 1.035125732421875, 1.157470703125, 1.279815673828125, 1.40216064453125, 1.524505615234375, 1.6468505859375, 1.769195556640625, 1.89154052734375, 2.013885498046875, 2.13623046875, 2.258575439453125, 2.38092041015625, 2.503265380859375, 2.6256103515625, 2.747955322265625, 2.87030029296875, 2.992645263671875, 3.114990234375, 3.237335205078125, 3.35968017578125, 3.482025146484375, 3.6043701171875, 3.726715087890625, 3.84906005859375, 3.971405029296875, 4.09375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 8.0, 8.0, 15.0, 18.0, 20.0, 44.0, 68.0, 92.0, 124.0, 162.0, 127.0, 108.0, 66.0, 45.0, 28.0, 17.0, 15.0, 15.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.93829345703125, -32.163124084472656, -31.387950897216797, -30.612781524658203, -29.837610244750977, -29.06243896484375, -28.287269592285156, -27.51209831237793, -26.736927032470703, -25.961755752563477, -25.18658447265625, -24.411415100097656, -23.63624382019043, -22.861072540283203, -22.08590316772461, -21.310731887817383, -20.535560607910156, -19.76038932800293, -18.985218048095703, -18.21004867553711, -17.434877395629883, -16.659706115722656, -15.884535789489746, -15.109365463256836, -14.33419418334961, -13.559022903442383, -12.783852577209473, -12.008682250976562, -11.233510971069336, -10.45833969116211, -9.6831693649292, -8.907999038696289, -8.13282585144043, -7.357655048370361, -6.582484245300293, -5.807313442230225, -5.032142639160156, -4.256971836090088, -3.4818010330200195, -2.706630229949951, -1.9314594268798828, -1.1562886238098145, -0.3811178207397461, 0.39405298233032227, 1.1692237854003906, 1.944394588470459, 2.7195653915405273, 3.4947361946105957, 4.269906997680664, 5.045077800750732, 5.820248603820801, 6.595419406890869, 7.3705902099609375, 8.145761489868164, 8.920931816101074, 9.696102142333984, 10.471273422241211, 11.246444702148438, 12.021615028381348, 12.796785354614258, 13.571956634521484, 14.347127914428711, 15.122298240661621, 15.897468566894531, 16.672639846801758]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 3.0, 8.0, 11.0, 12.0, 15.0, 17.0, 17.0, 24.0, 27.0, 24.0, 26.0, 23.0, 29.0, 35.0, 31.0, 35.0, 45.0, 52.0, 45.0, 40.0, 45.0, 45.0, 29.0, 35.0, 39.0, 35.0, 34.0, 21.0, 27.0, 25.0, 27.0, 19.0, 16.0, 12.0, 11.0, 8.0, 8.0, 7.0, 6.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.81635570526123, -12.397385597229004, -11.978415489196777, -11.559446334838867, -11.14047622680664, -10.721506118774414, -10.302536010742188, -9.883565902709961, -9.464595794677734, -9.045625686645508, -8.626655578613281, -8.207685470581055, -7.7887163162231445, -7.369746208190918, -6.950776100158691, -6.531805992126465, -6.112836837768555, -5.693866729736328, -5.27489709854126, -4.855926990509033, -4.436957359313965, -4.017987251281738, -3.5990171432495117, -3.1800472736358643, -2.761077404022217, -2.3421075344085693, -1.9231375455856323, -1.5041675567626953, -1.0851976871490479, -0.6662278175354004, -0.24725770950317383, 0.17171216011047363, 0.5906810760498047, 1.0096509456634521, 1.4286209344863892, 1.8475909233093262, 2.2665607929229736, 2.685530662536621, 3.1045007705688477, 3.523470640182495, 3.9424405097961426, 4.361410617828369, 4.7803802490234375, 5.199350357055664, 5.618320465087891, 6.037290096282959, 6.4562602043151855, 6.875229835510254, 7.2941999435424805, 7.713170051574707, 8.132140159606934, 8.551109313964844, 8.97007942199707, 9.389049530029297, 9.808019638061523, 10.22698974609375, 10.645959854125977, 11.064929962158203, 11.48390007019043, 11.902870178222656, 12.321839332580566, 12.740809440612793, 13.15977954864502, 13.578749656677246, 13.997718811035156]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 9.0, 8.0, 11.0, 14.0, 22.0, 28.0, 41.0, 61.0, 105.0, 173.0, 216.0, 382.0, 620.0, 960.0, 1721.0, 3190.0, 6105.0, 13030.0, 32265.0, 93003.0, 387015.0, 363862.0, 88887.0, 30809.0, 12703.0, 5809.0, 3121.0, 1683.0, 1013.0, 601.0, 381.0, 265.0, 141.0, 86.0, 70.0, 46.0, 34.0, 19.0, 13.0, 8.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.5908203125, -1.54107666015625, -1.4913330078125, -1.44158935546875, -1.391845703125, -1.34210205078125, -1.2923583984375, -1.24261474609375, -1.19287109375, -1.14312744140625, -1.0933837890625, -1.04364013671875, -0.993896484375, -0.94415283203125, -0.8944091796875, -0.84466552734375, -0.794921875, -0.74517822265625, -0.6954345703125, -0.64569091796875, -0.595947265625, -0.54620361328125, -0.4964599609375, -0.44671630859375, -0.39697265625, -0.34722900390625, -0.2974853515625, -0.24774169921875, -0.197998046875, -0.14825439453125, -0.0985107421875, -0.04876708984375, 0.0009765625, 0.05072021484375, 0.1004638671875, 0.15020751953125, 0.199951171875, 0.24969482421875, 0.2994384765625, 0.34918212890625, 0.39892578125, 0.44866943359375, 0.4984130859375, 0.54815673828125, 0.597900390625, 0.64764404296875, 0.6973876953125, 0.74713134765625, 0.796875, 0.84661865234375, 0.8963623046875, 0.94610595703125, 0.995849609375, 1.04559326171875, 1.0953369140625, 1.14508056640625, 1.19482421875, 1.24456787109375, 1.2943115234375, 1.34405517578125, 1.393798828125, 1.44354248046875, 1.4932861328125, 1.54302978515625, 1.5927734375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 10.0, 8.0, 12.0, 12.0, 13.0, 16.0, 24.0, 26.0, 32.0, 43.0, 35.0, 42.0, 51.0, 50.0, 44.0, 50.0, 35.0, 54.0, 44.0, 47.0, 51.0, 45.0, 34.0, 37.0, 32.0, 23.0, 29.0, 19.0, 17.0, 14.0, 11.0, 9.0, 8.0, 8.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.23046875, -1.1959075927734375, -1.161346435546875, -1.1267852783203125, -1.09222412109375, -1.0576629638671875, -1.023101806640625, -0.9885406494140625, -0.9539794921875, -0.9194183349609375, -0.884857177734375, -0.8502960205078125, -0.81573486328125, -0.7811737060546875, -0.746612548828125, -0.7120513916015625, -0.677490234375, -0.6429290771484375, -0.608367919921875, -0.5738067626953125, -0.53924560546875, -0.5046844482421875, -0.470123291015625, -0.4355621337890625, -0.4010009765625, -0.3664398193359375, -0.331878662109375, -0.2973175048828125, -0.26275634765625, -0.2281951904296875, -0.193634033203125, -0.1590728759765625, -0.12451171875, -0.0899505615234375, -0.055389404296875, -0.0208282470703125, 0.01373291015625, 0.0482940673828125, 0.082855224609375, 0.1174163818359375, 0.1519775390625, 0.1865386962890625, 0.221099853515625, 0.2556610107421875, 0.29022216796875, 0.3247833251953125, 0.359344482421875, 0.3939056396484375, 0.428466796875, 0.4630279541015625, 0.497589111328125, 0.5321502685546875, 0.56671142578125, 0.6012725830078125, 0.635833740234375, 0.6703948974609375, 0.7049560546875, 0.7395172119140625, 0.774078369140625, 0.8086395263671875, 0.84320068359375, 0.8777618408203125, 0.912322998046875, 0.9468841552734375, 0.9814453125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 12.0, 12.0, 11.0, 24.0, 31.0, 42.0, 68.0, 115.0, 174.0, 329.0, 690.0, 1853.0, 7295.0, 60937.0, 909814.0, 56762.0, 7040.0, 1857.0, 682.0, 321.0, 172.0, 118.0, 61.0, 49.0, 23.0, 15.0, 14.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.70703125, -3.602569580078125, -3.49810791015625, -3.393646240234375, -3.2891845703125, -3.184722900390625, -3.08026123046875, -2.975799560546875, -2.871337890625, -2.766876220703125, -2.66241455078125, -2.557952880859375, -2.4534912109375, -2.349029541015625, -2.24456787109375, -2.140106201171875, -2.03564453125, -1.931182861328125, -1.82672119140625, -1.722259521484375, -1.6177978515625, -1.513336181640625, -1.40887451171875, -1.304412841796875, -1.199951171875, -1.095489501953125, -0.99102783203125, -0.886566162109375, -0.7821044921875, -0.677642822265625, -0.57318115234375, -0.468719482421875, -0.3642578125, -0.259796142578125, -0.15533447265625, -0.050872802734375, 0.0535888671875, 0.158050537109375, 0.26251220703125, 0.366973876953125, 0.471435546875, 0.575897216796875, 0.68035888671875, 0.784820556640625, 0.8892822265625, 0.993743896484375, 1.09820556640625, 1.202667236328125, 1.30712890625, 1.411590576171875, 1.51605224609375, 1.620513916015625, 1.7249755859375, 1.829437255859375, 1.93389892578125, 2.038360595703125, 2.142822265625, 2.247283935546875, 2.35174560546875, 2.456207275390625, 2.5606689453125, 2.665130615234375, 2.76959228515625, 2.874053955078125, 2.978515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 7.0, 6.0, 6.0, 7.0, 12.0, 19.0, 19.0, 15.0, 20.0, 16.0, 19.0, 20.0, 35.0, 34.0, 52.0, 53.0, 77.0, 73.0, 75.0, 78.0, 52.0, 47.0, 38.0, 25.0, 31.0, 15.0, 25.0, 16.0, 15.0, 21.0, 3.0, 12.0, 12.0, 6.0, 10.0, 5.0, 7.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.2734375, -4.142822265625, -4.01220703125, -3.881591796875, -3.7509765625, -3.620361328125, -3.48974609375, -3.359130859375, -3.228515625, -3.097900390625, -2.96728515625, -2.836669921875, -2.7060546875, -2.575439453125, -2.44482421875, -2.314208984375, -2.18359375, -2.052978515625, -1.92236328125, -1.791748046875, -1.6611328125, -1.530517578125, -1.39990234375, -1.269287109375, -1.138671875, -1.008056640625, -0.87744140625, -0.746826171875, -0.6162109375, -0.485595703125, -0.35498046875, -0.224365234375, -0.09375, 0.036865234375, 0.16748046875, 0.298095703125, 0.4287109375, 0.559326171875, 0.68994140625, 0.820556640625, 0.951171875, 1.081787109375, 1.21240234375, 1.343017578125, 1.4736328125, 1.604248046875, 1.73486328125, 1.865478515625, 1.99609375, 2.126708984375, 2.25732421875, 2.387939453125, 2.5185546875, 2.649169921875, 2.77978515625, 2.910400390625, 3.041015625, 3.171630859375, 3.30224609375, 3.432861328125, 3.5634765625, 3.694091796875, 3.82470703125, 3.955322265625, 4.0859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 6.0, 13.0, 12.0, 17.0, 28.0, 37.0, 49.0, 49.0, 107.0, 196.0, 343.0, 919.0, 2852.0, 13383.0, 157082.0, 843301.0, 23542.0, 4312.0, 1263.0, 474.0, 212.0, 119.0, 78.0, 36.0, 33.0, 26.0, 12.0, 8.0, 10.0, 11.0, 11.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.822265625, -0.7966842651367188, -0.7711029052734375, -0.7455215454101562, -0.719940185546875, -0.6943588256835938, -0.6687774658203125, -0.6431961059570312, -0.61761474609375, -0.5920333862304688, -0.5664520263671875, -0.5408706665039062, -0.515289306640625, -0.48970794677734375, -0.4641265869140625, -0.43854522705078125, -0.4129638671875, -0.38738250732421875, -0.3618011474609375, -0.33621978759765625, -0.310638427734375, -0.28505706787109375, -0.2594757080078125, -0.23389434814453125, -0.20831298828125, -0.18273162841796875, -0.1571502685546875, -0.13156890869140625, -0.105987548828125, -0.08040618896484375, -0.0548248291015625, -0.02924346923828125, -0.003662109375, 0.02191925048828125, 0.0475006103515625, 0.07308197021484375, 0.098663330078125, 0.12424468994140625, 0.1498260498046875, 0.17540740966796875, 0.20098876953125, 0.22657012939453125, 0.2521514892578125, 0.27773284912109375, 0.303314208984375, 0.32889556884765625, 0.3544769287109375, 0.38005828857421875, 0.4056396484375, 0.43122100830078125, 0.4568023681640625, 0.48238372802734375, 0.507965087890625, 0.5335464477539062, 0.5591278076171875, 0.5847091674804688, 0.61029052734375, 0.6358718872070312, 0.6614532470703125, 0.6870346069335938, 0.712615966796875, 0.7381973266601562, 0.7637786865234375, 0.7893600463867188, 0.81494140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 7.0, 5.0, 13.0, 15.0, 22.0, 18.0, 23.0, 28.0, 54.0, 63.0, 95.0, 105.0, 103.0, 93.0, 65.0, 57.0, 48.0, 23.0, 35.0, 13.0, 14.0, 21.0, 7.0, 5.0, 7.0, 4.0, 3.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00016760826110839844, -0.00016271322965621948, -0.00015781819820404053, -0.00015292316675186157, -0.00014802813529968262, -0.00014313310384750366, -0.0001382380723953247, -0.00013334304094314575, -0.0001284480094909668, -0.00012355297803878784, -0.00011865794658660889, -0.00011376291513442993, -0.00010886788368225098, -0.00010397285223007202, -9.907782077789307e-05, -9.418278932571411e-05, -8.928775787353516e-05, -8.43927264213562e-05, -7.949769496917725e-05, -7.460266351699829e-05, -6.970763206481934e-05, -6.481260061264038e-05, -5.9917569160461426e-05, -5.502253770828247e-05, -5.0127506256103516e-05, -4.523247480392456e-05, -4.0337443351745605e-05, -3.544241189956665e-05, -3.0547380447387695e-05, -2.565234899520874e-05, -2.0757317543029785e-05, -1.586228609085083e-05, -1.0967254638671875e-05, -6.07222318649292e-06, -1.1771917343139648e-06, 3.7178397178649902e-06, 8.612871170043945e-06, 1.35079026222229e-05, 1.8402934074401855e-05, 2.329796552658081e-05, 2.8192996978759766e-05, 3.308802843093872e-05, 3.7983059883117676e-05, 4.287809133529663e-05, 4.7773122787475586e-05, 5.266815423965454e-05, 5.7563185691833496e-05, 6.245821714401245e-05, 6.73532485961914e-05, 7.224828004837036e-05, 7.714331150054932e-05, 8.203834295272827e-05, 8.693337440490723e-05, 9.182840585708618e-05, 9.672343730926514e-05, 0.00010161846876144409, 0.00010651350021362305, 0.000111408531665802, 0.00011630356311798096, 0.00012119859457015991, 0.00012609362602233887, 0.00013098865747451782, 0.00013588368892669678, 0.00014077872037887573, 0.0001456737518310547]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 6.0, 11.0, 19.0, 25.0, 35.0, 61.0, 92.0, 136.0, 216.0, 408.0, 755.0, 1852.0, 4892.0, 16288.0, 79402.0, 830221.0, 87473.0, 17547.0, 5232.0, 1915.0, 920.0, 384.0, 240.0, 154.0, 77.0, 56.0, 37.0, 20.0, 24.0, 12.0, 12.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.431640625, -0.4187660217285156, -0.40589141845703125, -0.3930168151855469, -0.3801422119140625, -0.3672676086425781, -0.35439300537109375, -0.3415184020996094, -0.328643798828125, -0.3157691955566406, -0.30289459228515625, -0.2900199890136719, -0.2771453857421875, -0.2642707824707031, -0.25139617919921875, -0.23852157592773438, -0.22564697265625, -0.21277236938476562, -0.19989776611328125, -0.18702316284179688, -0.1741485595703125, -0.16127395629882812, -0.14839935302734375, -0.13552474975585938, -0.122650146484375, -0.10977554321289062, -0.09690093994140625, -0.08402633666992188, -0.0711517333984375, -0.058277130126953125, -0.04540252685546875, -0.032527923583984375, -0.0196533203125, -0.006778717041015625, 0.00609588623046875, 0.018970489501953125, 0.0318450927734375, 0.044719696044921875, 0.05759429931640625, 0.07046890258789062, 0.083343505859375, 0.09621810913085938, 0.10909271240234375, 0.12196731567382812, 0.1348419189453125, 0.14771652221679688, 0.16059112548828125, 0.17346572875976562, 0.18634033203125, 0.19921493530273438, 0.21208953857421875, 0.22496414184570312, 0.2378387451171875, 0.2507133483886719, 0.26358795166015625, 0.2764625549316406, 0.289337158203125, 0.3022117614746094, 0.31508636474609375, 0.3279609680175781, 0.3408355712890625, 0.3537101745605469, 0.36658477783203125, 0.3794593811035156, 0.392333984375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0, 5.0, 3.0, 4.0, 4.0, 8.0, 4.0, 9.0, 12.0, 14.0, 11.0, 20.0, 7.0, 15.0, 11.0, 37.0, 36.0, 44.0, 65.0, 71.0, 108.0, 113.0, 75.0, 51.0, 55.0, 29.0, 26.0, 20.0, 32.0, 18.0, 10.0, 7.0, 7.0, 13.0, 13.0, 9.0, 3.0, 5.0, 4.0, 3.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.4091796875, -0.3961830139160156, -0.38318634033203125, -0.3701896667480469, -0.3571929931640625, -0.3441963195800781, -0.33119964599609375, -0.3182029724121094, -0.305206298828125, -0.2922096252441406, -0.27921295166015625, -0.2662162780761719, -0.2532196044921875, -0.24022293090820312, -0.22722625732421875, -0.21422958374023438, -0.20123291015625, -0.18823623657226562, -0.17523956298828125, -0.16224288940429688, -0.1492462158203125, -0.13624954223632812, -0.12325286865234375, -0.11025619506835938, -0.097259521484375, -0.08426284790039062, -0.07126617431640625, -0.058269500732421875, -0.0452728271484375, -0.032276153564453125, -0.01927947998046875, -0.006282806396484375, 0.0067138671875, 0.019710540771484375, 0.03270721435546875, 0.045703887939453125, 0.0587005615234375, 0.07169723510742188, 0.08469390869140625, 0.09769058227539062, 0.110687255859375, 0.12368392944335938, 0.13668060302734375, 0.14967727661132812, 0.1626739501953125, 0.17567062377929688, 0.18866729736328125, 0.20166397094726562, 0.21466064453125, 0.22765731811523438, 0.24065399169921875, 0.2536506652832031, 0.2666473388671875, 0.2796440124511719, 0.29264068603515625, 0.3056373596191406, 0.318634033203125, 0.3316307067871094, 0.34462738037109375, 0.3576240539550781, 0.3706207275390625, 0.3836174011230469, 0.39661407470703125, 0.4096107482910156, 0.422607421875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 12.0, 27.0, 92.0, 632.0, 155.0, 60.0, 17.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.067142486572266, -43.76972579956055, -42.47230911254883, -41.17489242553711, -39.877479553222656, -38.58006286621094, -37.28264617919922, -35.9852294921875, -34.68781280517578, -33.39039611816406, -32.092979431152344, -30.795564651489258, -29.49814796447754, -28.20073127746582, -26.903316497802734, -25.605899810791016, -24.308483123779297, -23.011066436767578, -21.71364974975586, -20.416234970092773, -19.118818283081055, -17.821401596069336, -16.52398681640625, -15.226570129394531, -13.929153442382812, -12.631736755371094, -11.334321022033691, -10.036905288696289, -8.73948860168457, -7.44207239151001, -6.144656181335449, -4.847240447998047, -3.5498275756835938, -2.252411365509033, -0.9549951553344727, 0.3424210548400879, 1.6398372650146484, 2.937253475189209, 4.2346696853637695, 5.532085418701172, 6.829502105712891, 8.12691879272461, 9.424334526062012, 10.721750259399414, 12.019166946411133, 13.316583633422852, 14.613999366760254, 15.911415100097656, 17.208831787109375, 18.506248474121094, 19.803665161132812, 21.1010799407959, 22.398496627807617, 23.695913314819336, 24.993328094482422, 26.29074478149414, 27.58816146850586, 28.885578155517578, 30.182994842529297, 31.480409622192383, 32.77782440185547, 34.07524108886719, 35.372657775878906, 36.670074462890625, 37.967491149902344]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 2.0, 11.0, 11.0, 7.0, 15.0, 16.0, 23.0, 21.0, 27.0, 32.0, 48.0, 133.0, 382.0, 62.0, 37.0, 29.0, 35.0, 23.0, 21.0, 17.0, 19.0, 9.0, 12.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.31124496459961, -25.717653274536133, -25.124059677124023, -24.530467987060547, -23.93687629699707, -23.343284606933594, -22.749691009521484, -22.156099319458008, -21.56250762939453, -20.968915939331055, -20.375322341918945, -19.78173065185547, -19.188138961791992, -18.594547271728516, -18.000953674316406, -17.40736198425293, -16.813770294189453, -16.220178604125977, -15.626585960388184, -15.03299331665039, -14.439401626586914, -13.845808982849121, -13.252216339111328, -12.658624649047852, -12.065031051635742, -11.47143840789795, -10.877846717834473, -10.28425407409668, -9.690662384033203, -9.09706974029541, -8.503477096557617, -7.909885406494141, -7.3162946701049805, -6.722702503204346, -6.129110336303711, -5.535517692565918, -4.941926002502441, -4.348333358764648, -3.7547411918640137, -3.161149024963379, -2.567556858062744, -1.9739646911621094, -1.380372405052185, -0.7867801189422607, -0.19318795204162598, 0.4004042148590088, 0.9939966201782227, 1.5875887870788574, 2.181180953979492, 2.774773120880127, 3.3683652877807617, 3.9619576930999756, 4.555549621582031, 5.149142265319824, 5.742734432220459, 6.336326599121094, 6.9299187660217285, 7.523510932922363, 8.117103576660156, 8.710695266723633, 9.304287910461426, 9.897879600524902, 10.491472244262695, 11.085063934326172, 11.678656578063965]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 8.0, 8.0, 9.0, 16.0, 17.0, 9.0, 20.0, 19.0, 28.0, 25.0, 24.0, 28.0, 45.0, 85.0, 201.0, 116.0, 53.0, 27.0, 27.0, 30.0, 27.0, 28.0, 17.0, 16.0, 19.0, 16.0, 22.0, 7.0, 11.0, 7.0, 6.0, 9.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.015625, -0.9863510131835938, -0.9570770263671875, -0.9278030395507812, -0.898529052734375, -0.8692550659179688, -0.8399810791015625, -0.8107070922851562, -0.78143310546875, -0.7521591186523438, -0.7228851318359375, -0.6936111450195312, -0.664337158203125, -0.6350631713867188, -0.6057891845703125, -0.5765151977539062, -0.5472412109375, -0.5179672241210938, -0.4886932373046875, -0.45941925048828125, -0.430145263671875, -0.40087127685546875, -0.3715972900390625, -0.34232330322265625, -0.31304931640625, -0.28377532958984375, -0.2545013427734375, -0.22522735595703125, -0.195953369140625, -0.16667938232421875, -0.1374053955078125, -0.10813140869140625, -0.078857421875, -0.04958343505859375, -0.0203094482421875, 0.00896453857421875, 0.038238525390625, 0.06751251220703125, 0.0967864990234375, 0.12606048583984375, 0.15533447265625, 0.18460845947265625, 0.2138824462890625, 0.24315643310546875, 0.272430419921875, 0.30170440673828125, 0.3309783935546875, 0.36025238037109375, 0.3895263671875, 0.41880035400390625, 0.4480743408203125, 0.47734832763671875, 0.506622314453125, 0.5358963012695312, 0.5651702880859375, 0.5944442749023438, 0.62371826171875, 0.6529922485351562, 0.6822662353515625, 0.7115402221679688, 0.740814208984375, 0.7700881958007812, 0.7993621826171875, 0.8286361694335938, 0.85791015625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 15.0, 6.0, 21.0, 24.0, 57.0, 160.0, 483.0, 2502.0, 42343.0, 8336921.0, 4849.0, 800.0, 202.0, 75.0, 35.0, 31.0, 9.0, 6.0, 7.0, 6.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-14.636923789978027, -14.151557922363281, -13.666192054748535, -13.180826187133789, -12.695460319519043, -12.210094451904297, -11.724727630615234, -11.239362716674805, -10.753995895385742, -10.268630027770996, -9.78326416015625, -9.297898292541504, -8.812532424926758, -8.327166557312012, -7.841800212860107, -7.356434345245361, -6.871068954467773, -6.385703086853027, -5.900337219238281, -5.414971351623535, -4.929605484008789, -4.444239616394043, -3.9588732719421387, -3.4735074043273926, -2.9881415367126465, -2.5027756690979004, -2.0174098014831543, -1.532043695449829, -1.046677827835083, -0.5613119602203369, -0.07594585418701172, 0.4094200134277344, 0.8947849273681641, 1.3801507949829102, 1.8655167818069458, 2.3508827686309814, 2.8362486362457275, 3.3216145038604736, 3.806980609893799, 4.292346477508545, 4.777712345123291, 5.263078212738037, 5.748444080352783, 6.2338104248046875, 6.719176292419434, 7.20454216003418, 7.689908027648926, 8.175273895263672, 8.660639762878418, 9.146005630493164, 9.63137149810791, 10.116737365722656, 10.602103233337402, 11.087469100952148, 11.572835922241211, 12.05820083618164, 12.543567657470703, 13.02893352508545, 13.514299392700195, 13.999665260314941, 14.485031127929688, 14.970396995544434, 15.45576286315918, 15.941129684448242, 16.426494598388672]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 8.0, 7.0, 1.0, 5.0, 4.0, 11.0, 4.0, 7.0, 4.0, 8.0, 5.0, 3.0, 6.0, 2.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-11.512982368469238, -11.189505577087402, -10.866028785705566, -10.54255199432373, -10.219076156616211, -9.895599365234375, -9.572122573852539, -9.248645782470703, -8.925168991088867, -8.601692199707031, -8.278215408325195, -7.954739093780518, -7.631262302398682, -7.307785511016846, -6.984309196472168, -6.660832405090332, -6.337355613708496, -6.01387882232666, -5.690402030944824, -5.3669257164001465, -5.0434489250183105, -4.719972133636475, -4.396495819091797, -4.073019027709961, -3.749542236328125, -3.426065444946289, -3.1025888919830322, -2.7791123390197754, -2.4556355476379395, -2.1321587562561035, -1.8086822032928467, -1.4852056503295898, -1.1617279052734375, -0.8382512331008911, -0.5147745609283447, -0.19129788875579834, 0.13217878341674805, 0.45565545558929443, 0.7791321277618408, 1.1026086807250977, 1.4260854721069336, 1.74956214427948, 2.0730388164520264, 2.396515369415283, 2.719992160797119, 3.043468952178955, 3.366945505142212, 3.6904220581054688, 4.013898849487305, 4.337375640869141, 4.660852432250977, 4.984328746795654, 5.30780553817749, 5.631282329559326, 5.954758644104004, 6.27823543548584, 6.601712226867676, 6.925189018249512, 7.248665809631348, 7.572142124176025, 7.895618915557861, 8.219095230102539, 8.542572021484375, 8.866048812866211, 9.189525604248047]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 7.0, 5.0, 15.0, 10.0, 14.0, 19.0, 16.0, 24.0, 38.0, 41.0, 53.0, 95.0, 117.0, 185.0, 312.0, 623.0, 1303.0, 3017.0, 7527.0, 20047.0, 55782.0, 149823.0, 175897.0, 69207.0, 24273.0, 9190.0, 3497.0, 1459.0, 683.0, 360.0, 189.0, 114.0, 91.0, 58.0, 48.0, 33.0, 23.0, 19.0, 15.0, 9.0, 7.0, 2.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.8671875, -7.629638671875, -7.39208984375, -7.154541015625, -6.9169921875, -6.679443359375, -6.44189453125, -6.204345703125, -5.966796875, -5.729248046875, -5.49169921875, -5.254150390625, -5.0166015625, -4.779052734375, -4.54150390625, -4.303955078125, -4.06640625, -3.828857421875, -3.59130859375, -3.353759765625, -3.1162109375, -2.878662109375, -2.64111328125, -2.403564453125, -2.166015625, -1.928466796875, -1.69091796875, -1.453369140625, -1.2158203125, -0.978271484375, -0.74072265625, -0.503173828125, -0.265625, -0.028076171875, 0.20947265625, 0.447021484375, 0.6845703125, 0.922119140625, 1.15966796875, 1.397216796875, 1.634765625, 1.872314453125, 2.10986328125, 2.347412109375, 2.5849609375, 2.822509765625, 3.06005859375, 3.297607421875, 3.53515625, 3.772705078125, 4.01025390625, 4.247802734375, 4.4853515625, 4.722900390625, 4.96044921875, 5.197998046875, 5.435546875, 5.673095703125, 5.91064453125, 6.148193359375, 6.3857421875, 6.623291015625, 6.86083984375, 7.098388671875, 7.3359375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 9.0, 4.0, 4.0, 20.0, 12.0, 20.0, 25.0, 28.0, 30.0, 51.0, 56.0, 56.0, 70.0, 69.0, 64.0, 84.0, 69.0, 57.0, 37.0, 54.0, 36.0, 26.0, 17.0, 17.0, 14.0, 18.0, 11.0, 9.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3701171875, -1.33001708984375, -1.2899169921875, -1.24981689453125, -1.209716796875, -1.16961669921875, -1.1295166015625, -1.08941650390625, -1.04931640625, -1.00921630859375, -0.9691162109375, -0.92901611328125, -0.888916015625, -0.84881591796875, -0.8087158203125, -0.76861572265625, -0.728515625, -0.68841552734375, -0.6483154296875, -0.60821533203125, -0.568115234375, -0.52801513671875, -0.4879150390625, -0.44781494140625, -0.40771484375, -0.36761474609375, -0.3275146484375, -0.28741455078125, -0.247314453125, -0.20721435546875, -0.1671142578125, -0.12701416015625, -0.0869140625, -0.04681396484375, -0.0067138671875, 0.03338623046875, 0.073486328125, 0.11358642578125, 0.1536865234375, 0.19378662109375, 0.23388671875, 0.27398681640625, 0.3140869140625, 0.35418701171875, 0.394287109375, 0.43438720703125, 0.4744873046875, 0.51458740234375, 0.5546875, 0.59478759765625, 0.6348876953125, 0.67498779296875, 0.715087890625, 0.75518798828125, 0.7952880859375, 0.83538818359375, 0.87548828125, 0.91558837890625, 0.9556884765625, 0.99578857421875, 1.035888671875, 1.07598876953125, 1.1160888671875, 1.15618896484375, 1.1962890625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 7.0, 19.0, 16.0, 65.0, 133.0, 125.0, 70.0, 18.0, 10.0, 10.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.671615600585938, -8.208333015441895, -7.74505090713501, -7.281768321990967, -6.818486213684082, -6.355203628540039, -5.891921043395996, -5.428638935089111, -4.965356826782227, -4.502074241638184, -4.038792133331299, -3.575509548187256, -3.112227439880371, -2.648944854736328, -2.1856625080108643, -1.7223801612854004, -1.2590975761413574, -0.7958152294158936, -0.3325328230857849, 0.13074958324432373, 0.5940319299697876, 1.057314395904541, 1.5205967426300049, 1.9838790893554688, 2.4471614360809326, 2.9104437828063965, 3.3737261295318604, 3.837008476257324, 4.300291061401367, 4.76357364654541, 5.226855754852295, 5.69013786315918, 6.153420448303223, 6.616703033447266, 7.07998514175415, 7.543267726898193, 8.006549835205078, 8.469832420349121, 8.933115005493164, 9.39639663696289, 9.859679222106934, 10.322961807250977, 10.78624439239502, 11.249526023864746, 11.712808609008789, 12.176091194152832, 12.639373779296875, 13.102655410766602, 13.565938949584961, 14.029221534729004, 14.492504119873047, 14.955785751342773, 15.419068336486816, 15.88235092163086, 16.345632553100586, 16.808916091918945, 17.272197723388672, 17.7354793548584, 18.198762893676758, 18.662044525146484, 19.125328063964844, 19.58860969543457, 20.051891326904297, 20.515174865722656, 20.978456497192383]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 7.0, 5.0, 9.0, 8.0, 21.0, 42.0, 127.0, 121.0, 60.0, 18.0, 13.0, 7.0, 6.0, 6.0, 7.0, 2.0, 6.0, 1.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.394720077514648, -9.122709274291992, -8.850698471069336, -8.578688621520996, -8.30667781829834, -8.034667015075684, -7.762656211853027, -7.490645408630371, -7.218635082244873, -6.946624279022217, -6.674613952636719, -6.4026031494140625, -6.130592346191406, -5.858582019805908, -5.586571216583252, -5.314560890197754, -5.042550086975098, -4.770539283752441, -4.498528957366943, -4.226518154144287, -3.95450758934021, -3.682497024536133, -3.4104862213134766, -3.1384756565093994, -2.8664650917053223, -2.594454526901245, -2.322443962097168, -2.0504331588745117, -1.7784225940704346, -1.5064120292663574, -1.2344013452529907, -0.962390661239624, -0.6903800964355469, -0.41836947202682495, -0.14635884761810303, 0.1256517767906189, 0.3976624011993408, 0.669672966003418, 0.9416836500167847, 1.2136943340301514, 1.4857048988342285, 1.7577154636383057, 2.029726028442383, 2.301736831665039, 2.573747396469116, 2.8457579612731934, 3.1177687644958496, 3.3897793292999268, 3.661789894104004, 3.933800458908081, 4.205811023712158, 4.4778218269348145, 4.7498321533203125, 5.021842956542969, 5.293853759765625, 5.565864562988281, 5.837874889373779, 6.1098856925964355, 6.381896018981934, 6.65390682220459, 6.925917625427246, 7.197927951812744, 7.4699387550354, 7.741949081420898, 8.013959884643555]}, "eval/loss": 4.192998886108398, "eval/wer": 1.903669178897263, "eval/runtime": 786.9912, "eval/samples_per_second": 3.357, "eval/steps_per_second": 0.281} \ No newline at end of file +{"train/loss": 4.3516, "train/learning_rate": 1.741654571843251e-07, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 6714, "_timestamp": 1646129566, "_step": 1191, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 28.0, 680.0, 301.0, 7.0, 1.0], "bins": [-571.5680541992188, -562.168701171875, -552.7693481445312, -543.3699951171875, -533.9706420898438, -524.5712890625, -515.171875, -505.7725524902344, -496.3731689453125, -486.97381591796875, -477.574462890625, -468.1750793457031, -458.7757263183594, -449.3763732910156, -439.9770202636719, -430.5776672363281, -421.1783142089844, -411.7789611816406, -402.3796081542969, -392.980224609375, -383.58087158203125, -374.1815185546875, -364.78216552734375, -355.3828125, -345.98345947265625, -336.5841064453125, -327.18475341796875, -317.7853698730469, -308.3860168457031, -298.9866638183594, -289.5873107910156, -280.1879577636719, -270.78857421875, -261.38922119140625, -251.98985290527344, -242.5904998779297, -233.19113159179688, -223.79177856445312, -214.39242553710938, -204.99307250976562, -195.59368896484375, -186.1943359375, -176.7949676513672, -167.39561462402344, -157.99624633789062, -148.59689331054688, -139.19754028320312, -129.79818725585938, -120.3988265991211, -110.99946594238281, -101.60011291503906, -92.20075225830078, -82.8013916015625, -73.40203094482422, -64.00267028808594, -54.60331726074219, -45.203956604003906, -35.804595947265625, -26.40523910522461, -17.00588035583496, -7.6065216064453125, 1.7928390502929688, 11.192195892333984, 20.591552734375, 29.990915298461914]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 5.0, 3.0, 8.0, 7.0, 9.0, 13.0, 12.0, 15.0, 26.0, 23.0, 30.0, 20.0, 28.0, 43.0, 47.0, 31.0, 42.0, 57.0, 39.0, 53.0, 49.0, 51.0, 40.0, 54.0, 45.0, 24.0, 26.0, 34.0, 19.0, 30.0, 12.0, 17.0, 17.0, 10.0, 11.0, 16.0, 11.0, 7.0, 5.0, 4.0, 0.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.36842346191406, -51.56277847290039, -49.75713348388672, -47.95148849487305, -46.145843505859375, -44.3401985168457, -42.53455352783203, -40.728904724121094, -38.92326354980469, -37.117618560791016, -35.311973571777344, -33.50632858276367, -31.70068359375, -29.895038604736328, -28.089391708374023, -26.28374671936035, -24.478099822998047, -22.672454833984375, -20.866809844970703, -19.06116485595703, -17.25551986694336, -15.449873924255371, -13.644227981567383, -11.838582992553711, -10.032938003540039, -8.227293014526367, -6.421647548675537, -4.616002082824707, -2.810357093811035, -1.0047121047973633, 0.800933837890625, 2.606578826904297, 4.412223815917969, 6.217868804931641, 8.023513793945312, 9.8291597366333, 11.634804725646973, 13.440449714660645, 15.246095657348633, 17.051740646362305, 18.857385635375977, 20.66303062438965, 22.46867561340332, 24.274322509765625, 26.079967498779297, 27.88561248779297, 29.69125747680664, 31.496902465820312, 33.302547454833984, 35.108192443847656, 36.91383743286133, 38.719482421875, 40.52512741088867, 42.330772399902344, 44.13642120361328, 45.94206237792969, 47.747711181640625, 49.5533561706543, 51.35900115966797, 53.16464614868164, 54.97029113769531, 56.775936126708984, 58.581581115722656, 60.387229919433594, 62.19287109375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 10.0, 10.0, 15.0, 17.0, 27.0, 42.0, 51.0, 54.0, 68.0, 81.0, 76.0, 97.0, 91.0, 87.0, 69.0, 55.0, 35.0, 38.0, 23.0, 26.0, 15.0, 9.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.70703125, -7.525390625, -7.34375, -7.162109375, -6.98046875, -6.798828125, -6.6171875, -6.435546875, -6.25390625, -6.072265625, -5.890625, -5.708984375, -5.52734375, -5.345703125, -5.1640625, -4.982421875, -4.80078125, -4.619140625, -4.4375, -4.255859375, -4.07421875, -3.892578125, -3.7109375, -3.529296875, -3.34765625, -3.166015625, -2.984375, -2.802734375, -2.62109375, -2.439453125, -2.2578125, -2.076171875, -1.89453125, -1.712890625, -1.53125, -1.349609375, -1.16796875, -0.986328125, -0.8046875, -0.623046875, -0.44140625, -0.259765625, -0.078125, 0.103515625, 0.28515625, 0.466796875, 0.6484375, 0.830078125, 1.01171875, 1.193359375, 1.375, 1.556640625, 1.73828125, 1.919921875, 2.1015625, 2.283203125, 2.46484375, 2.646484375, 2.828125, 3.009765625, 3.19140625, 3.373046875, 3.5546875, 3.736328125, 3.91796875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 7.0, 11.0, 15.0, 14.0, 26.0, 39.0, 78.0, 114.0, 244.0, 480.0, 1043.0, 2971.0, 12037.0, 112525.0, 3599716.0, 434632.0, 22931.0, 4657.0, 1478.0, 619.0, 279.0, 145.0, 78.0, 56.0, 39.0, 21.0, 15.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.484375, -25.833251953125, -25.18212890625, -24.531005859375, -23.8798828125, -23.228759765625, -22.57763671875, -21.926513671875, -21.275390625, -20.624267578125, -19.97314453125, -19.322021484375, -18.6708984375, -18.019775390625, -17.36865234375, -16.717529296875, -16.06640625, -15.415283203125, -14.76416015625, -14.113037109375, -13.4619140625, -12.810791015625, -12.15966796875, -11.508544921875, -10.857421875, -10.206298828125, -9.55517578125, -8.904052734375, -8.2529296875, -7.601806640625, -6.95068359375, -6.299560546875, -5.6484375, -4.997314453125, -4.34619140625, -3.695068359375, -3.0439453125, -2.392822265625, -1.74169921875, -1.090576171875, -0.439453125, 0.211669921875, 0.86279296875, 1.513916015625, 2.1650390625, 2.816162109375, 3.46728515625, 4.118408203125, 4.76953125, 5.420654296875, 6.07177734375, 6.722900390625, 7.3740234375, 8.025146484375, 8.67626953125, 9.327392578125, 9.978515625, 10.629638671875, 11.28076171875, 11.931884765625, 12.5830078125, 13.234130859375, 13.88525390625, 14.536376953125, 15.1875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 11.0, 8.0, 15.0, 24.0, 39.0, 64.0, 102.0, 186.0, 303.0, 565.0, 924.0, 785.0, 450.0, 247.0, 140.0, 85.0, 46.0, 33.0, 16.0, 11.0, 6.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.0625, -25.4390869140625, -24.815673828125, -24.1922607421875, -23.56884765625, -22.9454345703125, -22.322021484375, -21.6986083984375, -21.0751953125, -20.4517822265625, -19.828369140625, -19.2049560546875, -18.58154296875, -17.9581298828125, -17.334716796875, -16.7113037109375, -16.087890625, -15.4644775390625, -14.841064453125, -14.2176513671875, -13.59423828125, -12.9708251953125, -12.347412109375, -11.7239990234375, -11.1005859375, -10.4771728515625, -9.853759765625, -9.2303466796875, -8.60693359375, -7.9835205078125, -7.360107421875, -6.7366943359375, -6.11328125, -5.4898681640625, -4.866455078125, -4.2430419921875, -3.61962890625, -2.9962158203125, -2.372802734375, -1.7493896484375, -1.1259765625, -0.5025634765625, 0.120849609375, 0.7442626953125, 1.36767578125, 1.9910888671875, 2.614501953125, 3.2379150390625, 3.861328125, 4.4847412109375, 5.108154296875, 5.7315673828125, 6.35498046875, 6.9783935546875, 7.601806640625, 8.2252197265625, 8.8486328125, 9.4720458984375, 10.095458984375, 10.7188720703125, 11.34228515625, 11.9656982421875, 12.589111328125, 13.2125244140625, 13.8359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 6.0, 14.0, 17.0, 51.0, 73.0, 166.0, 392.0, 1072.0, 4721.0, 3545464.0, 637411.0, 3411.0, 864.0, 309.0, 133.0, 72.0, 33.0, 34.0, 13.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.4375, -78.71484375, -75.9921875, -73.26953125, -70.546875, -67.82421875, -65.1015625, -62.37890625, -59.65625, -56.93359375, -54.2109375, -51.48828125, -48.765625, -46.04296875, -43.3203125, -40.59765625, -37.875, -35.15234375, -32.4296875, -29.70703125, -26.984375, -24.26171875, -21.5390625, -18.81640625, -16.09375, -13.37109375, -10.6484375, -7.92578125, -5.203125, -2.48046875, 0.2421875, 2.96484375, 5.6875, 8.41015625, 11.1328125, 13.85546875, 16.578125, 19.30078125, 22.0234375, 24.74609375, 27.46875, 30.19140625, 32.9140625, 35.63671875, 38.359375, 41.08203125, 43.8046875, 46.52734375, 49.25, 51.97265625, 54.6953125, 57.41796875, 60.140625, 62.86328125, 65.5859375, 68.30859375, 71.03125, 73.75390625, 76.4765625, 79.19921875, 81.921875, 84.64453125, 87.3671875, 90.08984375, 92.8125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 18.0, 74.0, 299.0, 391.0, 176.0, 42.0, 8.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.13645553588867, -28.68865203857422, -25.240848541259766, -21.793045043945312, -18.34524154663086, -14.897438049316406, -11.449634552001953, -8.0018310546875, -4.554027557373047, -1.1062240600585938, 2.3415794372558594, 5.7893829345703125, 9.237186431884766, 12.684989929199219, 16.132793426513672, 19.580596923828125, 23.028400421142578, 26.47620391845703, 29.924007415771484, 33.37181091308594, 36.81961441040039, 40.267417907714844, 43.7152214050293, 47.16302490234375, 50.6108283996582, 54.058631896972656, 57.50643539428711, 60.95423889160156, 64.40203857421875, 67.84984588623047, 71.29765319824219, 74.74545288085938, 78.19325256347656, 81.64105224609375, 85.08885955810547, 88.53666687011719, 91.98446655273438, 95.43226623535156, 98.88007354736328, 102.327880859375, 105.77568054199219, 109.22348022460938, 112.6712875366211, 116.11909484863281, 119.56689453125, 123.01469421386719, 126.4625015258789, 129.91030883789062, 133.3581085205078, 136.805908203125, 140.25372314453125, 143.70152282714844, 147.14932250976562, 150.5971221923828, 154.044921875, 157.49273681640625, 160.94053649902344, 164.38833618164062, 167.83615112304688, 171.28395080566406, 174.73175048828125, 178.17955017089844, 181.62734985351562, 185.07516479492188, 188.52296447753906]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 11.0, 10.0, 13.0, 17.0, 15.0, 22.0, 38.0, 32.0, 40.0, 48.0, 52.0, 58.0, 50.0, 61.0, 57.0, 54.0, 68.0, 48.0, 61.0, 39.0, 43.0, 29.0, 28.0, 23.0, 23.0, 15.0, 10.0, 12.0, 8.0, 4.0, 4.0, 7.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.120880126953125, -53.443641662597656, -51.76640319824219, -50.08916473388672, -48.41192626953125, -46.73468780517578, -45.05744552612305, -43.38020706176758, -41.70296859741211, -40.02573013305664, -38.34849166870117, -36.6712532043457, -34.99401092529297, -33.3167724609375, -31.63953399658203, -29.962295532226562, -28.285057067871094, -26.607818603515625, -24.930580139160156, -23.253339767456055, -21.576101303100586, -19.898862838745117, -18.221622467041016, -16.544384002685547, -14.867145538330078, -13.18990707397461, -11.512667655944824, -9.835428237915039, -8.15818977355957, -6.480951309204102, -4.803711891174316, -3.1264724731445312, -1.4492340087890625, 0.22800493240356445, 1.9052438735961914, 3.5824828147888184, 5.259721755981445, 6.936960220336914, 8.6141996383667, 10.291439056396484, 11.968677520751953, 13.645915985107422, 15.323155403137207, 17.000394821166992, 18.67763328552246, 20.35487174987793, 22.03211212158203, 23.7093505859375, 25.38658905029297, 27.063827514648438, 28.741065979003906, 30.418306350708008, 32.095542907714844, 33.77278137207031, 35.45002365112305, 37.127262115478516, 38.804500579833984, 40.48173904418945, 42.15897750854492, 43.83621597290039, 45.513458251953125, 47.190696716308594, 48.86793518066406, 50.54517364501953, 52.222412109375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 3.0, 13.0, 15.0, 12.0, 16.0, 17.0, 25.0, 26.0, 26.0, 26.0, 43.0, 40.0, 40.0, 49.0, 63.0, 64.0, 65.0, 65.0, 60.0, 67.0, 38.0, 34.0, 34.0, 28.0, 26.0, 19.0, 19.0, 15.0, 17.0, 9.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.9921875, -4.8699951171875, -4.747802734375, -4.6256103515625, -4.50341796875, -4.3812255859375, -4.259033203125, -4.1368408203125, -4.0146484375, -3.8924560546875, -3.770263671875, -3.6480712890625, -3.52587890625, -3.4036865234375, -3.281494140625, -3.1593017578125, -3.037109375, -2.9149169921875, -2.792724609375, -2.6705322265625, -2.54833984375, -2.4261474609375, -2.303955078125, -2.1817626953125, -2.0595703125, -1.9373779296875, -1.815185546875, -1.6929931640625, -1.57080078125, -1.4486083984375, -1.326416015625, -1.2042236328125, -1.08203125, -0.9598388671875, -0.837646484375, -0.7154541015625, -0.59326171875, -0.4710693359375, -0.348876953125, -0.2266845703125, -0.1044921875, 0.0177001953125, 0.139892578125, 0.2620849609375, 0.38427734375, 0.5064697265625, 0.628662109375, 0.7508544921875, 0.873046875, 0.9952392578125, 1.117431640625, 1.2396240234375, 1.36181640625, 1.4840087890625, 1.606201171875, 1.7283935546875, 1.8505859375, 1.9727783203125, 2.094970703125, 2.2171630859375, 2.33935546875, 2.4615478515625, 2.583740234375, 2.7059326171875, 2.828125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 8.0, 19.0, 22.0, 29.0, 48.0, 63.0, 113.0, 149.0, 236.0, 394.0, 601.0, 959.0, 1544.0, 2700.0, 4523.0, 7869.0, 14193.0, 26898.0, 51923.0, 105188.0, 234836.0, 304580.0, 145208.0, 68993.0, 34600.0, 18535.0, 10306.0, 5606.0, 3285.0, 1886.0, 1227.0, 704.0, 442.0, 263.0, 201.0, 138.0, 85.0, 40.0, 33.0, 31.0, 16.0, 16.0, 8.0, 10.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56298828125, -0.5443496704101562, -0.5257110595703125, -0.5070724487304688, -0.488433837890625, -0.46979522705078125, -0.4511566162109375, -0.43251800537109375, -0.41387939453125, -0.39524078369140625, -0.3766021728515625, -0.35796356201171875, -0.339324951171875, -0.32068634033203125, -0.3020477294921875, -0.28340911865234375, -0.2647705078125, -0.24613189697265625, -0.2274932861328125, -0.20885467529296875, -0.190216064453125, -0.17157745361328125, -0.1529388427734375, -0.13430023193359375, -0.11566162109375, -0.09702301025390625, -0.0783843994140625, -0.05974578857421875, -0.041107177734375, -0.02246856689453125, -0.0038299560546875, 0.01480865478515625, 0.033447265625, 0.05208587646484375, 0.0707244873046875, 0.08936309814453125, 0.108001708984375, 0.12664031982421875, 0.1452789306640625, 0.16391754150390625, 0.18255615234375, 0.20119476318359375, 0.2198333740234375, 0.23847198486328125, 0.257110595703125, 0.27574920654296875, 0.2943878173828125, 0.31302642822265625, 0.3316650390625, 0.35030364990234375, 0.3689422607421875, 0.38758087158203125, 0.406219482421875, 0.42485809326171875, 0.4434967041015625, 0.46213531494140625, 0.48077392578125, 0.49941253662109375, 0.5180511474609375, 0.5366897583007812, 0.555328369140625, 0.5739669799804688, 0.5926055908203125, 0.6112442016601562, 0.6298828125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 10.0, 9.0, 10.0, 9.0, 9.0, 7.0, 10.0, 19.0, 19.0, 20.0, 21.0, 23.0, 34.0, 25.0, 37.0, 31.0, 39.0, 38.0, 45.0, 36.0, 37.0, 1069.0, 44.0, 24.0, 42.0, 32.0, 37.0, 37.0, 31.0, 25.0, 21.0, 29.0, 24.0, 19.0, 17.0, 19.0, 16.0, 10.0, 10.0, 7.0, 5.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7822265625, -1.7237091064453125, -1.665191650390625, -1.6066741943359375, -1.54815673828125, -1.4896392822265625, -1.431121826171875, -1.3726043701171875, -1.3140869140625, -1.2555694580078125, -1.197052001953125, -1.1385345458984375, -1.08001708984375, -1.0214996337890625, -0.962982177734375, -0.9044647216796875, -0.845947265625, -0.7874298095703125, -0.728912353515625, -0.6703948974609375, -0.61187744140625, -0.5533599853515625, -0.494842529296875, -0.4363250732421875, -0.3778076171875, -0.3192901611328125, -0.260772705078125, -0.2022552490234375, -0.14373779296875, -0.0852203369140625, -0.026702880859375, 0.0318145751953125, 0.09033203125, 0.1488494873046875, 0.207366943359375, 0.2658843994140625, 0.32440185546875, 0.3829193115234375, 0.441436767578125, 0.4999542236328125, 0.5584716796875, 0.6169891357421875, 0.675506591796875, 0.7340240478515625, 0.79254150390625, 0.8510589599609375, 0.909576416015625, 0.9680938720703125, 1.026611328125, 1.0851287841796875, 1.143646240234375, 1.2021636962890625, 1.26068115234375, 1.3191986083984375, 1.377716064453125, 1.4362335205078125, 1.4947509765625, 1.5532684326171875, 1.611785888671875, 1.6703033447265625, 1.72882080078125, 1.7873382568359375, 1.845855712890625, 1.9043731689453125, 1.962890625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 0.0, 6.0, 6.0, 9.0, 21.0, 36.0, 37.0, 60.0, 110.0, 160.0, 235.0, 356.0, 604.0, 885.0, 1563.0, 2494.0, 3972.0, 6892.0, 11570.0, 20294.0, 36413.0, 68491.0, 131573.0, 265142.0, 1237728.0, 142367.0, 74084.0, 39603.0, 21445.0, 12427.0, 7248.0, 4395.0, 2585.0, 1608.0, 1009.0, 607.0, 377.0, 249.0, 179.0, 103.0, 66.0, 36.0, 28.0, 22.0, 18.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.361328125, -0.3503990173339844, -0.33946990966796875, -0.3285408020019531, -0.3176116943359375, -0.3066825866699219, -0.29575347900390625, -0.2848243713378906, -0.273895263671875, -0.2629661560058594, -0.25203704833984375, -0.24110794067382812, -0.2301788330078125, -0.21924972534179688, -0.20832061767578125, -0.19739151000976562, -0.18646240234375, -0.17553329467773438, -0.16460418701171875, -0.15367507934570312, -0.1427459716796875, -0.13181686401367188, -0.12088775634765625, -0.10995864868164062, -0.099029541015625, -0.08810043334960938, -0.07717132568359375, -0.06624221801757812, -0.0553131103515625, -0.044384002685546875, -0.03345489501953125, -0.022525787353515625, -0.0115966796875, -0.000667572021484375, 0.01026153564453125, 0.021190643310546875, 0.0321197509765625, 0.043048858642578125, 0.05397796630859375, 0.06490707397460938, 0.075836181640625, 0.08676528930664062, 0.09769439697265625, 0.10862350463867188, 0.1195526123046875, 0.13048171997070312, 0.14141082763671875, 0.15233993530273438, 0.16326904296875, 0.17419815063476562, 0.18512725830078125, 0.19605636596679688, 0.2069854736328125, 0.21791458129882812, 0.22884368896484375, 0.23977279663085938, 0.250701904296875, 0.2616310119628906, 0.27256011962890625, 0.2834892272949219, 0.2944183349609375, 0.3053474426269531, 0.31627655029296875, 0.3272056579589844, 0.338134765625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 5.0, 16.0, 11.0, 14.0, 10.0, 10.0, 24.0, 24.0, 29.0, 36.0, 39.0, 47.0, 55.0, 75.0, 72.0, 76.0, 80.0, 64.0, 59.0, 44.0, 42.0, 26.0, 27.0, 27.0, 11.0, 23.0, 10.0, 5.0, 7.0, 7.0, 1.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018644332885742188, -0.0018067359924316406, -0.0017490386962890625, -0.0016913414001464844, -0.0016336441040039062, -0.0015759468078613281, -0.00151824951171875, -0.0014605522155761719, -0.0014028549194335938, -0.0013451576232910156, -0.0012874603271484375, -0.0012297630310058594, -0.0011720657348632812, -0.0011143684387207031, -0.001056671142578125, -0.0009989738464355469, -0.0009412765502929688, -0.0008835792541503906, -0.0008258819580078125, -0.0007681846618652344, -0.0007104873657226562, -0.0006527900695800781, -0.0005950927734375, -0.0005373954772949219, -0.00047969818115234375, -0.0004220008850097656, -0.0003643035888671875, -0.0003066062927246094, -0.00024890899658203125, -0.00019121170043945312, -0.000133514404296875, -7.581710815429688e-05, -1.811981201171875e-05, 3.9577484130859375e-05, 9.72747802734375e-05, 0.00015497207641601562, 0.00021266937255859375, 0.0002703666687011719, 0.00032806396484375, 0.0003857612609863281, 0.00044345855712890625, 0.0005011558532714844, 0.0005588531494140625, 0.0006165504455566406, 0.0006742477416992188, 0.0007319450378417969, 0.000789642333984375, 0.0008473396301269531, 0.0009050369262695312, 0.0009627342224121094, 0.0010204315185546875, 0.0010781288146972656, 0.0011358261108398438, 0.0011935234069824219, 0.001251220703125, 0.0013089179992675781, 0.0013666152954101562, 0.0014243125915527344, 0.0014820098876953125, 0.0015397071838378906, 0.0015974044799804688, 0.0016551017761230469, 0.001712799072265625, 0.0017704963684082031, 0.0018281936645507812]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 5.0, 8.0, 6.0, 19.0, 23.0, 31.0, 34.0, 69.0, 99.0, 112.0, 163.0, 222.0, 325.0, 474.0, 1284.0, 1038664.0, 5160.0, 609.0, 354.0, 232.0, 151.0, 133.0, 103.0, 65.0, 69.0, 24.0, 26.0, 18.0, 28.0, 5.0, 8.0, 9.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.044189453125, -0.04287576675415039, -0.04156208038330078, -0.04024839401245117, -0.03893470764160156, -0.03762102127075195, -0.036307334899902344, -0.034993648529052734, -0.033679962158203125, -0.032366275787353516, -0.031052589416503906, -0.029738903045654297, -0.028425216674804688, -0.027111530303955078, -0.02579784393310547, -0.02448415756225586, -0.02317047119140625, -0.02185678482055664, -0.02054309844970703, -0.019229412078857422, -0.017915725708007812, -0.016602039337158203, -0.015288352966308594, -0.013974666595458984, -0.012660980224609375, -0.011347293853759766, -0.010033607482910156, -0.008719921112060547, -0.0074062347412109375, -0.006092548370361328, -0.004778861999511719, -0.0034651756286621094, -0.0021514892578125, -0.0008378028869628906, 0.00047588348388671875, 0.0017895698547363281, 0.0031032562255859375, 0.004416942596435547, 0.005730628967285156, 0.007044315338134766, 0.008358001708984375, 0.009671688079833984, 0.010985374450683594, 0.012299060821533203, 0.013612747192382812, 0.014926433563232422, 0.01624011993408203, 0.01755380630493164, 0.01886749267578125, 0.02018117904663086, 0.02149486541748047, 0.022808551788330078, 0.024122238159179688, 0.025435924530029297, 0.026749610900878906, 0.028063297271728516, 0.029376983642578125, 0.030690670013427734, 0.032004356384277344, 0.03331804275512695, 0.03463172912597656, 0.03594541549682617, 0.03725910186767578, 0.03857278823852539, 0.039886474609375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1008.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006473960820585489, 0.00025259109679609537, 0.0011525782756507397, 0.002052565338090062, 0.0029525526333600283, 0.0038525399286299944, 0.004752526991069317, 0.005652514286339283, 0.006552501581609249, 0.007452488876879215, 0.008352476172149181, 0.009252462536096573, 0.010152449831366539, 0.011052437126636505, 0.011952424421906471, 0.012852411717176437, 0.013752399012446404, 0.01465238630771637, 0.015552373602986336, 0.016452360898256302, 0.017352348193526268, 0.018252335488796234, 0.01915232092142105, 0.020052310079336166, 0.020952295511960983, 0.02185228280723095, 0.022752270102500916, 0.02365225739777088, 0.024552244693040848, 0.025452231988310814, 0.02635221928358078, 0.027252204716205597, 0.028152193874120712, 0.02905218116939068, 0.029952168464660645, 0.03085215575993061, 0.03175214305520058, 0.032652128487825394, 0.03355211764574051, 0.034452103078365326, 0.03535209223628044, 0.03625207766890526, 0.037152066826820374, 0.03805205225944519, 0.038952041417360306, 0.03985202684998512, 0.04075201600790024, 0.041652001440525055, 0.04255198687314987, 0.04345197230577469, 0.044351961463689804, 0.04525194689631462, 0.046151936054229736, 0.04705192148685455, 0.04795191064476967, 0.048851896077394485, 0.0497518852353096, 0.05065187066793442, 0.05155185982584953, 0.05245184525847435, 0.053351834416389465, 0.05425181984901428, 0.0551518090069294, 0.056051794439554214, 0.05695178359746933]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 22.0, 11.0, 31.0, 39.0, 40.0, 62.0, 70.0, 77.0, 54.0, 83.0, 75.0, 79.0, 50.0, 72.0, 75.0, 43.0, 39.0, 24.0, 24.0, 18.0, 10.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020893216133117676, -0.0020346548408269882, -0.001979988068342209, -0.0019253212958574295, -0.0018706545233726501, -0.0018159877508878708, -0.0017613209784030914, -0.001706654205918312, -0.0016519874334335327, -0.0015973206609487534, -0.001542653888463974, -0.0014879871159791946, -0.0014333203434944153, -0.001378653571009636, -0.0013239867985248566, -0.0012693200260400772, -0.0012146532535552979, -0.0011599864810705185, -0.0011053197085857391, -0.0010506529361009598, -0.0009959861636161804, -0.0009413193911314011, -0.0008866526186466217, -0.0008319858461618423, -0.000777319073677063, -0.0007226523011922836, -0.0006679855287075043, -0.0006133187562227249, -0.0005586519837379456, -0.0005039852112531662, -0.00044931843876838684, -0.0003946516662836075, -0.0003399848937988281, -0.00028531812131404877, -0.0002306513488292694, -0.00017598457634449005, -0.0001213178038597107, -6.665103137493134e-05, -1.1984258890151978e-05, 4.268251359462738e-05, 9.734928607940674e-05, 0.0001520160585641861, 0.00020668283104896545, 0.0002613496035337448, 0.00031601637601852417, 0.00037068314850330353, 0.0004253499209880829, 0.00048001669347286224, 0.0005346834659576416, 0.000589350238442421, 0.0006440170109272003, 0.0006986837834119797, 0.000753350555896759, 0.0008080173283815384, 0.0008626841008663177, 0.0009173508733510971, 0.0009720176458358765, 0.0010266844183206558, 0.0010813511908054352, 0.0011360179632902145, 0.001190684735774994, 0.0012453515082597733, 0.0013000182807445526, 0.001354685053229332, 0.0014093518257141113]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 3.0, 14.0, 14.0, 12.0, 16.0, 17.0, 25.0, 26.0, 26.0, 26.0, 43.0, 40.0, 40.0, 49.0, 63.0, 64.0, 65.0, 65.0, 60.0, 67.0, 38.0, 34.0, 34.0, 28.0, 26.0, 19.0, 19.0, 15.0, 17.0, 9.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.9921875, -4.8699951171875, -4.747802734375, -4.6256103515625, -4.50341796875, -4.3812255859375, -4.259033203125, -4.1368408203125, -4.0146484375, -3.8924560546875, -3.770263671875, -3.6480712890625, -3.52587890625, -3.4036865234375, -3.281494140625, -3.1593017578125, -3.037109375, -2.9149169921875, -2.792724609375, -2.6705322265625, -2.54833984375, -2.4261474609375, -2.303955078125, -2.1817626953125, -2.0595703125, -1.9373779296875, -1.815185546875, -1.6929931640625, -1.57080078125, -1.4486083984375, -1.326416015625, -1.2042236328125, -1.08203125, -0.9598388671875, -0.837646484375, -0.7154541015625, -0.59326171875, -0.4710693359375, -0.348876953125, -0.2266845703125, -0.1044921875, 0.0177001953125, 0.139892578125, 0.2620849609375, 0.38427734375, 0.5064697265625, 0.628662109375, 0.7508544921875, 0.873046875, 0.9952392578125, 1.117431640625, 1.2396240234375, 1.36181640625, 1.4840087890625, 1.606201171875, 1.7283935546875, 1.8505859375, 1.9727783203125, 2.094970703125, 2.2171630859375, 2.33935546875, 2.4615478515625, 2.583740234375, 2.7059326171875, 2.828125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 10.0, 6.0, 22.0, 20.0, 26.0, 41.0, 70.0, 77.0, 91.0, 142.0, 198.0, 248.0, 374.0, 517.0, 776.0, 1126.0, 1690.0, 2672.0, 4374.0, 7768.0, 14682.0, 44616.0, 646530.0, 264752.0, 28594.0, 11713.0, 6518.0, 3687.0, 2340.0, 1446.0, 1032.0, 686.0, 487.0, 334.0, 239.0, 177.0, 138.0, 81.0, 77.0, 41.0, 39.0, 24.0, 28.0, 10.0, 7.0, 7.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-16.65625, -16.149169921875, -15.64208984375, -15.135009765625, -14.6279296875, -14.120849609375, -13.61376953125, -13.106689453125, -12.599609375, -12.092529296875, -11.58544921875, -11.078369140625, -10.5712890625, -10.064208984375, -9.55712890625, -9.050048828125, -8.54296875, -8.035888671875, -7.52880859375, -7.021728515625, -6.5146484375, -6.007568359375, -5.50048828125, -4.993408203125, -4.486328125, -3.979248046875, -3.47216796875, -2.965087890625, -2.4580078125, -1.950927734375, -1.44384765625, -0.936767578125, -0.4296875, 0.077392578125, 0.58447265625, 1.091552734375, 1.5986328125, 2.105712890625, 2.61279296875, 3.119873046875, 3.626953125, 4.134033203125, 4.64111328125, 5.148193359375, 5.6552734375, 6.162353515625, 6.66943359375, 7.176513671875, 7.68359375, 8.190673828125, 8.69775390625, 9.204833984375, 9.7119140625, 10.218994140625, 10.72607421875, 11.233154296875, 11.740234375, 12.247314453125, 12.75439453125, 13.261474609375, 13.7685546875, 14.275634765625, 14.78271484375, 15.289794921875, 15.796875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 6.0, 5.0, 4.0, 10.0, 8.0, 7.0, 19.0, 17.0, 19.0, 15.0, 29.0, 27.0, 26.0, 24.0, 31.0, 43.0, 46.0, 45.0, 67.0, 139.0, 304.0, 1485.0, 185.0, 72.0, 64.0, 45.0, 43.0, 40.0, 29.0, 31.0, 30.0, 24.0, 18.0, 19.0, 21.0, 15.0, 11.0, 9.0, 5.0, 6.0, 4.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.421875, -9.138916015625, -8.85595703125, -8.572998046875, -8.2900390625, -8.007080078125, -7.72412109375, -7.441162109375, -7.158203125, -6.875244140625, -6.59228515625, -6.309326171875, -6.0263671875, -5.743408203125, -5.46044921875, -5.177490234375, -4.89453125, -4.611572265625, -4.32861328125, -4.045654296875, -3.7626953125, -3.479736328125, -3.19677734375, -2.913818359375, -2.630859375, -2.347900390625, -2.06494140625, -1.781982421875, -1.4990234375, -1.216064453125, -0.93310546875, -0.650146484375, -0.3671875, -0.084228515625, 0.19873046875, 0.481689453125, 0.7646484375, 1.047607421875, 1.33056640625, 1.613525390625, 1.896484375, 2.179443359375, 2.46240234375, 2.745361328125, 3.0283203125, 3.311279296875, 3.59423828125, 3.877197265625, 4.16015625, 4.443115234375, 4.72607421875, 5.009033203125, 5.2919921875, 5.574951171875, 5.85791015625, 6.140869140625, 6.423828125, 6.706787109375, 6.98974609375, 7.272705078125, 7.5556640625, 7.838623046875, 8.12158203125, 8.404541015625, 8.6875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 3.0, 9.0, 5.0, 15.0, 16.0, 15.0, 16.0, 28.0, 26.0, 31.0, 32.0, 37.0, 49.0, 70.0, 126.0, 359.0, 1690.0, 609565.0, 2530616.0, 1980.0, 440.0, 171.0, 77.0, 63.0, 40.0, 25.0, 27.0, 27.0, 17.0, 20.0, 23.0, 16.0, 15.0, 9.0, 13.0, 7.0, 3.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.0625, -36.7958984375, -35.529296875, -34.2626953125, -32.99609375, -31.7294921875, -30.462890625, -29.1962890625, -27.9296875, -26.6630859375, -25.396484375, -24.1298828125, -22.86328125, -21.5966796875, -20.330078125, -19.0634765625, -17.796875, -16.5302734375, -15.263671875, -13.9970703125, -12.73046875, -11.4638671875, -10.197265625, -8.9306640625, -7.6640625, -6.3974609375, -5.130859375, -3.8642578125, -2.59765625, -1.3310546875, -0.064453125, 1.2021484375, 2.46875, 3.7353515625, 5.001953125, 6.2685546875, 7.53515625, 8.8017578125, 10.068359375, 11.3349609375, 12.6015625, 13.8681640625, 15.134765625, 16.4013671875, 17.66796875, 18.9345703125, 20.201171875, 21.4677734375, 22.734375, 24.0009765625, 25.267578125, 26.5341796875, 27.80078125, 29.0673828125, 30.333984375, 31.6005859375, 32.8671875, 34.1337890625, 35.400390625, 36.6669921875, 37.93359375, 39.2001953125, 40.466796875, 41.7333984375, 43.0]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 530.0, 481.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.5656433105469, -267.69378662109375, -262.8218994140625, -257.9500427246094, -253.0781707763672, -248.206298828125, -243.3344268798828, -238.46255493164062, -233.59068298339844, -228.71881103515625, -223.84693908691406, -218.97506713867188, -214.10321044921875, -209.23133850097656, -204.35946655273438, -199.4875946044922, -194.61572265625, -189.7438507080078, -184.87197875976562, -180.0001220703125, -175.1282501220703, -170.25637817382812, -165.38450622558594, -160.51263427734375, -155.64077758789062, -150.76890563964844, -145.89703369140625, -141.02517700195312, -136.15330505371094, -131.28143310546875, -126.40956115722656, -121.53768920898438, -116.66583251953125, -111.79396057128906, -106.9220962524414, -102.05022430419922, -97.17835235595703, -92.30648803710938, -87.43461608886719, -82.562744140625, -77.69087219238281, -72.81900024414062, -67.94713592529297, -63.07526397705078, -58.203392028808594, -53.33152389526367, -48.45965576171875, -43.58778381347656, -38.71591567993164, -33.84404754638672, -28.97217559814453, -24.10030746459961, -19.228437423706055, -14.3565673828125, -9.484699249267578, -4.612827301025391, 0.25904083251953125, 5.130910396575928, 10.002779960632324, 14.874649047851562, 19.746519088745117, 24.618389129638672, 29.490257263183594, 34.36212921142578, 39.2339973449707]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 4.0, 4.0, 9.0, 11.0, 11.0, 8.0, 11.0, 14.0, 11.0, 24.0, 26.0, 32.0, 17.0, 33.0, 27.0, 24.0, 43.0, 32.0, 34.0, 43.0, 37.0, 39.0, 35.0, 32.0, 48.0, 43.0, 38.0, 31.0, 23.0, 32.0, 23.0, 32.0, 22.0, 16.0, 30.0, 15.0, 6.0, 14.0, 15.0, 11.0, 5.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.228797912597656, -27.306621551513672, -26.384445190429688, -25.462268829345703, -24.540090560913086, -23.6179141998291, -22.695737838745117, -21.773561477661133, -20.851383209228516, -19.92920684814453, -19.007030487060547, -18.084854125976562, -17.162675857543945, -16.24049949645996, -15.318323135375977, -14.396146774291992, -13.473970413208008, -12.551794052124023, -11.629616737365723, -10.707440376281738, -9.785263061523438, -8.863086700439453, -7.940910339355469, -7.018733501434326, -6.096556663513184, -5.174379825592041, -4.252202987670898, -3.330026626586914, -2.4078497886657715, -1.485672950744629, -0.5634965896606445, 0.35868024826049805, 1.2808570861816406, 2.203033924102783, 3.1252105236053467, 4.04738712310791, 4.969563961029053, 5.891740798950195, 6.81391716003418, 7.736093997955322, 8.658270835876465, 9.58044719696045, 10.50262451171875, 11.424800872802734, 12.346977233886719, 13.26915454864502, 14.191330909729004, 15.113508224487305, 16.03568458557129, 16.957860946655273, 17.880037307739258, 18.802215576171875, 19.72439193725586, 20.646568298339844, 21.568744659423828, 22.490921020507812, 23.413097381591797, 24.33527374267578, 25.257450103759766, 26.17962646484375, 27.101804733276367, 28.02398109436035, 28.946157455444336, 29.86833381652832, 30.790512084960938]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 6.0, 5.0, 4.0, 10.0, 13.0, 9.0, 12.0, 14.0, 26.0, 24.0, 26.0, 34.0, 34.0, 31.0, 29.0, 49.0, 47.0, 61.0, 67.0, 57.0, 71.0, 54.0, 61.0, 48.0, 34.0, 25.0, 33.0, 18.0, 23.0, 22.0, 12.0, 15.0, 12.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.90625, -4.779541015625, -4.65283203125, -4.526123046875, -4.3994140625, -4.272705078125, -4.14599609375, -4.019287109375, -3.892578125, -3.765869140625, -3.63916015625, -3.512451171875, -3.3857421875, -3.259033203125, -3.13232421875, -3.005615234375, -2.87890625, -2.752197265625, -2.62548828125, -2.498779296875, -2.3720703125, -2.245361328125, -2.11865234375, -1.991943359375, -1.865234375, -1.738525390625, -1.61181640625, -1.485107421875, -1.3583984375, -1.231689453125, -1.10498046875, -0.978271484375, -0.8515625, -0.724853515625, -0.59814453125, -0.471435546875, -0.3447265625, -0.218017578125, -0.09130859375, 0.035400390625, 0.162109375, 0.288818359375, 0.41552734375, 0.542236328125, 0.6689453125, 0.795654296875, 0.92236328125, 1.049072265625, 1.17578125, 1.302490234375, 1.42919921875, 1.555908203125, 1.6826171875, 1.809326171875, 1.93603515625, 2.062744140625, 2.189453125, 2.316162109375, 2.44287109375, 2.569580078125, 2.6962890625, 2.822998046875, 2.94970703125, 3.076416015625, 3.203125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 6.0, 6.0, 14.0, 24.0, 24.0, 30.0, 58.0, 77.0, 102.0, 154.0, 281.0, 514.0, 930.0, 1923.0, 4757.0, 13803.0, 60827.0, 1049947.0, 2901525.0, 125747.0, 21171.0, 6680.0, 2701.0, 1324.0, 650.0, 363.0, 218.0, 133.0, 88.0, 60.0, 38.0, 31.0, 20.0, 21.0, 11.0, 9.0, 3.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.25, -20.66259765625, -20.0751953125, -19.48779296875, -18.900390625, -18.31298828125, -17.7255859375, -17.13818359375, -16.55078125, -15.96337890625, -15.3759765625, -14.78857421875, -14.201171875, -13.61376953125, -13.0263671875, -12.43896484375, -11.8515625, -11.26416015625, -10.6767578125, -10.08935546875, -9.501953125, -8.91455078125, -8.3271484375, -7.73974609375, -7.15234375, -6.56494140625, -5.9775390625, -5.39013671875, -4.802734375, -4.21533203125, -3.6279296875, -3.04052734375, -2.453125, -1.86572265625, -1.2783203125, -0.69091796875, -0.103515625, 0.48388671875, 1.0712890625, 1.65869140625, 2.24609375, 2.83349609375, 3.4208984375, 4.00830078125, 4.595703125, 5.18310546875, 5.7705078125, 6.35791015625, 6.9453125, 7.53271484375, 8.1201171875, 8.70751953125, 9.294921875, 9.88232421875, 10.4697265625, 11.05712890625, 11.64453125, 12.23193359375, 12.8193359375, 13.40673828125, 13.994140625, 14.58154296875, 15.1689453125, 15.75634765625, 16.34375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 8.0, 16.0, 29.0, 31.0, 65.0, 61.0, 94.0, 152.0, 259.0, 369.0, 574.0, 680.0, 592.0, 363.0, 236.0, 161.0, 130.0, 77.0, 46.0, 35.0, 30.0, 20.0, 11.0, 10.0, 5.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.015625, -15.474853515625, -14.93408203125, -14.393310546875, -13.8525390625, -13.311767578125, -12.77099609375, -12.230224609375, -11.689453125, -11.148681640625, -10.60791015625, -10.067138671875, -9.5263671875, -8.985595703125, -8.44482421875, -7.904052734375, -7.36328125, -6.822509765625, -6.28173828125, -5.740966796875, -5.2001953125, -4.659423828125, -4.11865234375, -3.577880859375, -3.037109375, -2.496337890625, -1.95556640625, -1.414794921875, -0.8740234375, -0.333251953125, 0.20751953125, 0.748291015625, 1.2890625, 1.829833984375, 2.37060546875, 2.911376953125, 3.4521484375, 3.992919921875, 4.53369140625, 5.074462890625, 5.615234375, 6.156005859375, 6.69677734375, 7.237548828125, 7.7783203125, 8.319091796875, 8.85986328125, 9.400634765625, 9.94140625, 10.482177734375, 11.02294921875, 11.563720703125, 12.1044921875, 12.645263671875, 13.18603515625, 13.726806640625, 14.267578125, 14.808349609375, 15.34912109375, 15.889892578125, 16.4306640625, 16.971435546875, 17.51220703125, 18.052978515625, 18.59375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 6.0, 3.0, 8.0, 8.0, 16.0, 17.0, 16.0, 27.0, 43.0, 57.0, 75.0, 125.0, 230.0, 468.0, 1557.0, 26131.0, 4121096.0, 41456.0, 1770.0, 517.0, 242.0, 149.0, 88.0, 51.0, 43.0, 26.0, 16.0, 15.0, 13.0, 7.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.78125, -43.65576171875, -41.5302734375, -39.40478515625, -37.279296875, -35.15380859375, -33.0283203125, -30.90283203125, -28.77734375, -26.65185546875, -24.5263671875, -22.40087890625, -20.275390625, -18.14990234375, -16.0244140625, -13.89892578125, -11.7734375, -9.64794921875, -7.5224609375, -5.39697265625, -3.271484375, -1.14599609375, 0.9794921875, 3.10498046875, 5.23046875, 7.35595703125, 9.4814453125, 11.60693359375, 13.732421875, 15.85791015625, 17.9833984375, 20.10888671875, 22.234375, 24.35986328125, 26.4853515625, 28.61083984375, 30.736328125, 32.86181640625, 34.9873046875, 37.11279296875, 39.23828125, 41.36376953125, 43.4892578125, 45.61474609375, 47.740234375, 49.86572265625, 51.9912109375, 54.11669921875, 56.2421875, 58.36767578125, 60.4931640625, 62.61865234375, 64.744140625, 66.86962890625, 68.9951171875, 71.12060546875, 73.24609375, 75.37158203125, 77.4970703125, 79.62255859375, 81.748046875, 83.87353515625, 85.9990234375, 88.12451171875, 90.25]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [3.0, 6.0, 40.0, 255.0, 494.0, 200.0, 18.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.083255767822266, -16.30394744873047, -11.524641036987305, -6.745333671569824, -1.9660263061523438, 2.813282012939453, 7.592588424682617, 12.371894836425781, 17.151203155517578, 21.930511474609375, 26.70981788635254, 31.489124298095703, 36.2684326171875, 41.0477409362793, 45.827049255371094, 50.606353759765625, 55.38566207885742, 60.16497039794922, 64.94427490234375, 69.72358703613281, 74.50289154052734, 79.28219604492188, 84.06150817871094, 88.84081268310547, 93.6201171875, 98.39942169189453, 103.1787338256836, 107.95803833007812, 112.73735046386719, 117.51665496826172, 122.29595947265625, 127.07527160644531, 131.85458374023438, 136.63389587402344, 141.41319274902344, 146.1925048828125, 150.97181701660156, 155.75112915039062, 160.53042602539062, 165.3097381591797, 170.08905029296875, 174.8683624267578, 179.6476593017578, 184.42697143554688, 189.20628356933594, 193.985595703125, 198.764892578125, 203.54420471191406, 208.32350158691406, 213.10281372070312, 217.88211059570312, 222.6614227294922, 227.44073486328125, 232.22003173828125, 236.9993438720703, 241.77865600585938, 246.55795288085938, 251.33726501464844, 256.1165771484375, 260.8958740234375, 265.6751708984375, 270.4544982910156, 275.2337951660156, 280.0130920410156, 284.79241943359375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 9.0, 6.0, 5.0, 13.0, 8.0, 12.0, 29.0, 24.0, 19.0, 29.0, 32.0, 37.0, 27.0, 40.0, 28.0, 34.0, 42.0, 41.0, 45.0, 39.0, 49.0, 36.0, 42.0, 31.0, 31.0, 36.0, 26.0, 35.0, 29.0, 24.0, 25.0, 24.0, 21.0, 13.0, 10.0, 12.0, 8.0, 8.0, 1.0, 9.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-46.40675354003906, -45.116554260253906, -43.826358795166016, -42.53615951538086, -41.24596405029297, -39.95576477050781, -38.66556930541992, -37.375370025634766, -36.085174560546875, -34.79497528076172, -33.50477981567383, -32.21458053588867, -30.92438507080078, -29.634185791015625, -28.3439884185791, -27.053791046142578, -25.763591766357422, -24.4733943939209, -23.183197021484375, -21.89299964904785, -20.602802276611328, -19.312602996826172, -18.02240562438965, -16.732208251953125, -15.442010879516602, -14.151813507080078, -12.861616134643555, -11.571417808532715, -10.281220436096191, -8.991023063659668, -7.700825214385986, -6.410627365112305, -5.120429992675781, -3.8302323818206787, -2.540034770965576, -1.2498371601104736, 0.040360450744628906, 1.3305578231811523, 2.620755672454834, 3.9109535217285156, 5.201150894165039, 6.4913482666015625, 7.781546115875244, 9.071743965148926, 10.36194133758545, 11.652138710021973, 12.942337036132812, 14.232534408569336, 15.52273178100586, 16.812929153442383, 18.103126525878906, 19.39332389831543, 20.683521270751953, 21.97372055053711, 23.263917922973633, 24.554115295410156, 25.84431266784668, 27.134510040283203, 28.424707412719727, 29.71490478515625, 31.005104064941406, 32.2952995300293, 33.58549880981445, 34.875694274902344, 36.1658935546875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 1.0, 6.0, 3.0, 10.0, 11.0, 9.0, 14.0, 13.0, 14.0, 19.0, 28.0, 26.0, 30.0, 27.0, 32.0, 47.0, 42.0, 43.0, 51.0, 50.0, 67.0, 49.0, 50.0, 45.0, 53.0, 40.0, 35.0, 33.0, 28.0, 25.0, 22.0, 9.0, 22.0, 7.0, 6.0, 11.0, 8.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.49609375, -4.37762451171875, -4.2591552734375, -4.14068603515625, -4.022216796875, -3.90374755859375, -3.7852783203125, -3.66680908203125, -3.54833984375, -3.42987060546875, -3.3114013671875, -3.19293212890625, -3.074462890625, -2.95599365234375, -2.8375244140625, -2.71905517578125, -2.6005859375, -2.48211669921875, -2.3636474609375, -2.24517822265625, -2.126708984375, -2.00823974609375, -1.8897705078125, -1.77130126953125, -1.65283203125, -1.53436279296875, -1.4158935546875, -1.29742431640625, -1.178955078125, -1.06048583984375, -0.9420166015625, -0.82354736328125, -0.705078125, -0.58660888671875, -0.4681396484375, -0.34967041015625, -0.231201171875, -0.11273193359375, 0.0057373046875, 0.12420654296875, 0.24267578125, 0.36114501953125, 0.4796142578125, 0.59808349609375, 0.716552734375, 0.83502197265625, 0.9534912109375, 1.07196044921875, 1.1904296875, 1.30889892578125, 1.4273681640625, 1.54583740234375, 1.664306640625, 1.78277587890625, 1.9012451171875, 2.01971435546875, 2.13818359375, 2.25665283203125, 2.3751220703125, 2.49359130859375, 2.612060546875, 2.73052978515625, 2.8489990234375, 2.96746826171875, 3.0859375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 13.0, 6.0, 23.0, 19.0, 39.0, 53.0, 77.0, 116.0, 183.0, 284.0, 474.0, 747.0, 1227.0, 2047.0, 3547.0, 6184.0, 11355.0, 21021.0, 41068.0, 86923.0, 200200.0, 325293.0, 184761.0, 79960.0, 38326.0, 19745.0, 10609.0, 5810.0, 3377.0, 1961.0, 1163.0, 685.0, 451.0, 260.0, 190.0, 104.0, 77.0, 55.0, 29.0, 30.0, 15.0, 11.0, 13.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.669921875, -0.6492767333984375, -0.628631591796875, -0.6079864501953125, -0.58734130859375, -0.5666961669921875, -0.546051025390625, -0.5254058837890625, -0.5047607421875, -0.4841156005859375, -0.463470458984375, -0.4428253173828125, -0.42218017578125, -0.4015350341796875, -0.380889892578125, -0.3602447509765625, -0.339599609375, -0.3189544677734375, -0.298309326171875, -0.2776641845703125, -0.25701904296875, -0.2363739013671875, -0.215728759765625, -0.1950836181640625, -0.1744384765625, -0.1537933349609375, -0.133148193359375, -0.1125030517578125, -0.09185791015625, -0.0712127685546875, -0.050567626953125, -0.0299224853515625, -0.00927734375, 0.0113677978515625, 0.032012939453125, 0.0526580810546875, 0.07330322265625, 0.0939483642578125, 0.114593505859375, 0.1352386474609375, 0.1558837890625, 0.1765289306640625, 0.197174072265625, 0.2178192138671875, 0.23846435546875, 0.2591094970703125, 0.279754638671875, 0.3003997802734375, 0.321044921875, 0.3416900634765625, 0.362335205078125, 0.3829803466796875, 0.40362548828125, 0.4242706298828125, 0.444915771484375, 0.4655609130859375, 0.4862060546875, 0.5068511962890625, 0.527496337890625, 0.5481414794921875, 0.56878662109375, 0.5894317626953125, 0.610076904296875, 0.6307220458984375, 0.6513671875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 7.0, 7.0, 8.0, 12.0, 8.0, 14.0, 22.0, 20.0, 25.0, 29.0, 26.0, 37.0, 41.0, 37.0, 42.0, 43.0, 32.0, 41.0, 1070.0, 48.0, 40.0, 47.0, 43.0, 51.0, 32.0, 26.0, 38.0, 34.0, 14.0, 26.0, 20.0, 12.0, 17.0, 16.0, 7.0, 10.0, 7.0, 6.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.646484375, -2.5726318359375, -2.498779296875, -2.4249267578125, -2.35107421875, -2.2772216796875, -2.203369140625, -2.1295166015625, -2.0556640625, -1.9818115234375, -1.907958984375, -1.8341064453125, -1.76025390625, -1.6864013671875, -1.612548828125, -1.5386962890625, -1.46484375, -1.3909912109375, -1.317138671875, -1.2432861328125, -1.16943359375, -1.0955810546875, -1.021728515625, -0.9478759765625, -0.8740234375, -0.8001708984375, -0.726318359375, -0.6524658203125, -0.57861328125, -0.5047607421875, -0.430908203125, -0.3570556640625, -0.283203125, -0.2093505859375, -0.135498046875, -0.0616455078125, 0.01220703125, 0.0860595703125, 0.159912109375, 0.2337646484375, 0.3076171875, 0.3814697265625, 0.455322265625, 0.5291748046875, 0.60302734375, 0.6768798828125, 0.750732421875, 0.8245849609375, 0.8984375, 0.9722900390625, 1.046142578125, 1.1199951171875, 1.19384765625, 1.2677001953125, 1.341552734375, 1.4154052734375, 1.4892578125, 1.5631103515625, 1.636962890625, 1.7108154296875, 1.78466796875, 1.8585205078125, 1.932373046875, 2.0062255859375, 2.080078125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 7.0, 11.0, 26.0, 23.0, 39.0, 70.0, 110.0, 160.0, 255.0, 354.0, 612.0, 1009.0, 1554.0, 2522.0, 4265.0, 7103.0, 11614.0, 20325.0, 36282.0, 65720.0, 121570.0, 211293.0, 1277478.0, 149742.0, 80383.0, 44400.0, 24601.0, 14130.0, 8389.0, 4950.0, 3010.0, 1829.0, 1257.0, 746.0, 461.0, 305.0, 176.0, 126.0, 77.0, 48.0, 36.0, 23.0, 12.0, 10.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.370361328125, -0.3584785461425781, -0.34659576416015625, -0.3347129821777344, -0.3228302001953125, -0.3109474182128906, -0.29906463623046875, -0.2871818542480469, -0.275299072265625, -0.2634162902832031, -0.25153350830078125, -0.23965072631835938, -0.2277679443359375, -0.21588516235351562, -0.20400238037109375, -0.19211959838867188, -0.18023681640625, -0.16835403442382812, -0.15647125244140625, -0.14458847045898438, -0.1327056884765625, -0.12082290649414062, -0.10894012451171875, -0.09705734252929688, -0.085174560546875, -0.07329177856445312, -0.06140899658203125, -0.049526214599609375, -0.0376434326171875, -0.025760650634765625, -0.01387786865234375, -0.001995086669921875, 0.0098876953125, 0.021770477294921875, 0.03365325927734375, 0.045536041259765625, 0.0574188232421875, 0.06930160522460938, 0.08118438720703125, 0.09306716918945312, 0.104949951171875, 0.11683273315429688, 0.12871551513671875, 0.14059829711914062, 0.1524810791015625, 0.16436386108398438, 0.17624664306640625, 0.18812942504882812, 0.20001220703125, 0.21189498901367188, 0.22377777099609375, 0.23566055297851562, 0.2475433349609375, 0.2594261169433594, 0.27130889892578125, 0.2831916809082031, 0.295074462890625, 0.3069572448730469, 0.31884002685546875, 0.3307228088378906, 0.3426055908203125, 0.3544883728027344, 0.36637115478515625, 0.3782539367675781, 0.39013671875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 8.0, 6.0, 8.0, 11.0, 8.0, 8.0, 14.0, 22.0, 31.0, 47.0, 64.0, 81.0, 91.0, 113.0, 88.0, 104.0, 78.0, 53.0, 48.0, 26.0, 15.0, 17.0, 13.0, 9.0, 5.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002483367919921875, -0.0024057626724243164, -0.002328157424926758, -0.0022505521774291992, -0.0021729469299316406, -0.002095341682434082, -0.0020177364349365234, -0.0019401311874389648, -0.0018625259399414062, -0.0017849206924438477, -0.001707315444946289, -0.0016297101974487305, -0.0015521049499511719, -0.0014744997024536133, -0.0013968944549560547, -0.001319289207458496, -0.0012416839599609375, -0.001164078712463379, -0.0010864734649658203, -0.0010088682174682617, -0.0009312629699707031, -0.0008536577224731445, -0.0007760524749755859, -0.0006984472274780273, -0.0006208419799804688, -0.0005432367324829102, -0.00046563148498535156, -0.00038802623748779297, -0.0003104209899902344, -0.00023281574249267578, -0.0001552104949951172, -7.76052474975586e-05, 0.0, 7.76052474975586e-05, 0.0001552104949951172, 0.00023281574249267578, 0.0003104209899902344, 0.00038802623748779297, 0.00046563148498535156, 0.0005432367324829102, 0.0006208419799804688, 0.0006984472274780273, 0.0007760524749755859, 0.0008536577224731445, 0.0009312629699707031, 0.0010088682174682617, 0.0010864734649658203, 0.001164078712463379, 0.0012416839599609375, 0.001319289207458496, 0.0013968944549560547, 0.0014744997024536133, 0.0015521049499511719, 0.0016297101974487305, 0.001707315444946289, 0.0017849206924438477, 0.0018625259399414062, 0.0019401311874389648, 0.0020177364349365234, 0.002095341682434082, 0.0021729469299316406, 0.0022505521774291992, 0.002328157424926758, 0.0024057626724243164, 0.002483367919921875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 2.0, 2.0, 6.0, 10.0, 11.0, 18.0, 17.0, 21.0, 34.0, 25.0, 58.0, 99.0, 184.0, 357.0, 876.0, 1039773.0, 5860.0, 549.0, 222.0, 103.0, 81.0, 58.0, 40.0, 30.0, 17.0, 13.0, 22.0, 12.0, 10.0, 6.0, 5.0, 4.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.057647705078125, -0.0557103157043457, -0.053772926330566406, -0.05183553695678711, -0.04989814758300781, -0.047960758209228516, -0.04602336883544922, -0.04408597946166992, -0.042148590087890625, -0.04021120071411133, -0.03827381134033203, -0.036336421966552734, -0.03439903259277344, -0.03246164321899414, -0.030524253845214844, -0.028586864471435547, -0.02664947509765625, -0.024712085723876953, -0.022774696350097656, -0.02083730697631836, -0.018899917602539062, -0.016962528228759766, -0.015025138854980469, -0.013087749481201172, -0.011150360107421875, -0.009212970733642578, -0.007275581359863281, -0.005338191986083984, -0.0034008026123046875, -0.0014634132385253906, 0.00047397613525390625, 0.002411365509033203, 0.0043487548828125, 0.006286144256591797, 0.008223533630371094, 0.01016092300415039, 0.012098312377929688, 0.014035701751708984, 0.01597309112548828, 0.017910480499267578, 0.019847869873046875, 0.021785259246826172, 0.02372264862060547, 0.025660037994384766, 0.027597427368164062, 0.02953481674194336, 0.031472206115722656, 0.03340959548950195, 0.03534698486328125, 0.03728437423706055, 0.039221763610839844, 0.04115915298461914, 0.04309654235839844, 0.045033931732177734, 0.04697132110595703, 0.04890871047973633, 0.050846099853515625, 0.05278348922729492, 0.05472087860107422, 0.056658267974853516, 0.05859565734863281, 0.06053304672241211, 0.062470436096191406, 0.0644078254699707, 0.06634521484375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1020.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004157747142016888, -0.0025714323855936527, -0.0009851173963397741, 0.0006011975929141045, 0.0021875123493373394, 0.0037738271057605743, 0.005360142327845097, 0.006946456618607044, 0.008532771840691566, 0.010119087062776089, 0.011705401353538036, 0.013291716575622559, 0.014878030866384506, 0.016464345157146454, 0.01805066131055355, 0.0196369756013155, 0.021223291754722595, 0.022809606045484543, 0.02439592219889164, 0.025982236489653587, 0.027568550780415535, 0.029154866933822632, 0.03074118122458458, 0.03232749551534653, 0.033913809806108475, 0.03550012409687042, 0.03708643838763237, 0.03867275267839432, 0.040259070694446564, 0.04184538498520851, 0.04343169927597046, 0.04501801356673241, 0.04660433158278465, 0.0481906458735466, 0.04977696016430855, 0.051363274455070496, 0.05294959247112274, 0.05453590676188469, 0.05612222105264664, 0.057708535343408585, 0.05929484963417053, 0.06088116392493248, 0.06246747821569443, 0.06405379623174667, 0.06564010679721832, 0.06722642481327057, 0.06881274282932281, 0.07039905339479446, 0.07198537141084671, 0.07357168942689896, 0.0751579999923706, 0.07674431800842285, 0.0783306285738945, 0.07991694658994675, 0.0815032571554184, 0.08308957517147064, 0.08467588573694229, 0.08626220375299454, 0.08784851431846619, 0.08943483233451843, 0.09102114289999008, 0.09260746091604233, 0.09419377148151398, 0.09578008949756622, 0.09736640751361847]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 13.0, 17.0, 17.0, 25.0, 32.0, 38.0, 59.0, 46.0, 69.0, 64.0, 81.0, 68.0, 65.0, 75.0, 67.0, 54.0, 42.0, 42.0, 28.0, 33.0, 18.0, 16.0, 12.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0023022890090942383, -0.0022492017596960068, -0.0021961145102977753, -0.0021430272608995438, -0.0020899400115013123, -0.0020368527621030807, -0.0019837655127048492, -0.0019306782633066177, -0.0018775910139083862, -0.0018245037645101547, -0.0017714165151119232, -0.0017183292657136917, -0.0016652420163154602, -0.0016121547669172287, -0.0015590675175189972, -0.0015059802681207657, -0.0014528930187225342, -0.0013998057693243027, -0.0013467185199260712, -0.0012936312705278397, -0.0012405440211296082, -0.0011874567717313766, -0.0011343695223331451, -0.0010812822729349136, -0.0010281950235366821, -0.0009751077741384506, -0.0009220205247402191, -0.0008689332753419876, -0.0008158460259437561, -0.0007627587765455246, -0.0007096715271472931, -0.0006565842777490616, -0.0006034970283508301, -0.0005504097789525986, -0.0004973225295543671, -0.00044423528015613556, -0.00039114803075790405, -0.00033806078135967255, -0.00028497353196144104, -0.00023188628256320953, -0.00017879903316497803, -0.00012571178376674652, -7.262453436851501e-05, -1.9537284970283508e-05, 3.3549964427948e-05, 8.66372138261795e-05, 0.000139724463224411, 0.00019281171262264252, 0.000245898962020874, 0.00029898621141910553, 0.00035207346081733704, 0.00040516071021556854, 0.00045824795961380005, 0.0005113352090120316, 0.0005644224584102631, 0.0006175097078084946, 0.0006705969572067261, 0.0007236842066049576, 0.0007767714560031891, 0.0008298587054014206, 0.0008829459547996521, 0.0009360332041978836, 0.0009891204535961151, 0.0010422077029943466, 0.0010952949523925781]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 1.0, 6.0, 3.0, 10.0, 11.0, 9.0, 14.0, 13.0, 14.0, 19.0, 28.0, 26.0, 30.0, 27.0, 32.0, 47.0, 42.0, 43.0, 51.0, 50.0, 67.0, 49.0, 50.0, 45.0, 53.0, 40.0, 35.0, 33.0, 28.0, 25.0, 22.0, 9.0, 22.0, 7.0, 6.0, 11.0, 8.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.49609375, -4.37762451171875, -4.2591552734375, -4.14068603515625, -4.022216796875, -3.90374755859375, -3.7852783203125, -3.66680908203125, -3.54833984375, -3.42987060546875, -3.3114013671875, -3.19293212890625, -3.074462890625, -2.95599365234375, -2.8375244140625, -2.71905517578125, -2.6005859375, -2.48211669921875, -2.3636474609375, -2.24517822265625, -2.126708984375, -2.00823974609375, -1.8897705078125, -1.77130126953125, -1.65283203125, -1.53436279296875, -1.4158935546875, -1.29742431640625, -1.178955078125, -1.06048583984375, -0.9420166015625, -0.82354736328125, -0.705078125, -0.58660888671875, -0.4681396484375, -0.34967041015625, -0.231201171875, -0.11273193359375, 0.0057373046875, 0.12420654296875, 0.24267578125, 0.36114501953125, 0.4796142578125, 0.59808349609375, 0.716552734375, 0.83502197265625, 0.9534912109375, 1.07196044921875, 1.1904296875, 1.30889892578125, 1.4273681640625, 1.54583740234375, 1.664306640625, 1.78277587890625, 1.9012451171875, 2.01971435546875, 2.13818359375, 2.25665283203125, 2.3751220703125, 2.49359130859375, 2.612060546875, 2.73052978515625, 2.8489990234375, 2.96746826171875, 3.0859375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 8.0, 8.0, 5.0, 16.0, 34.0, 34.0, 58.0, 69.0, 99.0, 139.0, 255.0, 349.0, 672.0, 1421.0, 3299.0, 9388.0, 31628.0, 124581.0, 467862.0, 304425.0, 73147.0, 19804.0, 6328.0, 2432.0, 1048.0, 542.0, 305.0, 187.0, 118.0, 79.0, 63.0, 52.0, 32.0, 21.0, 11.0, 14.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.59375, -4.4617919921875, -4.329833984375, -4.1978759765625, -4.06591796875, -3.9339599609375, -3.802001953125, -3.6700439453125, -3.5380859375, -3.4061279296875, -3.274169921875, -3.1422119140625, -3.01025390625, -2.8782958984375, -2.746337890625, -2.6143798828125, -2.482421875, -2.3504638671875, -2.218505859375, -2.0865478515625, -1.95458984375, -1.8226318359375, -1.690673828125, -1.5587158203125, -1.4267578125, -1.2947998046875, -1.162841796875, -1.0308837890625, -0.89892578125, -0.7669677734375, -0.635009765625, -0.5030517578125, -0.37109375, -0.2391357421875, -0.107177734375, 0.0247802734375, 0.15673828125, 0.2886962890625, 0.420654296875, 0.5526123046875, 0.6845703125, 0.8165283203125, 0.948486328125, 1.0804443359375, 1.21240234375, 1.3443603515625, 1.476318359375, 1.6082763671875, 1.740234375, 1.8721923828125, 2.004150390625, 2.1361083984375, 2.26806640625, 2.4000244140625, 2.531982421875, 2.6639404296875, 2.7958984375, 2.9278564453125, 3.059814453125, 3.1917724609375, 3.32373046875, 3.4556884765625, 3.587646484375, 3.7196044921875, 3.8515625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 4.0, 14.0, 6.0, 5.0, 8.0, 9.0, 20.0, 14.0, 14.0, 21.0, 27.0, 30.0, 24.0, 39.0, 33.0, 30.0, 48.0, 50.0, 76.0, 133.0, 1613.0, 322.0, 86.0, 37.0, 33.0, 41.0, 40.0, 30.0, 27.0, 24.0, 25.0, 23.0, 23.0, 19.0, 19.0, 19.0, 8.0, 13.0, 10.0, 5.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-11.375, -11.0380859375, -10.701171875, -10.3642578125, -10.02734375, -9.6904296875, -9.353515625, -9.0166015625, -8.6796875, -8.3427734375, -8.005859375, -7.6689453125, -7.33203125, -6.9951171875, -6.658203125, -6.3212890625, -5.984375, -5.6474609375, -5.310546875, -4.9736328125, -4.63671875, -4.2998046875, -3.962890625, -3.6259765625, -3.2890625, -2.9521484375, -2.615234375, -2.2783203125, -1.94140625, -1.6044921875, -1.267578125, -0.9306640625, -0.59375, -0.2568359375, 0.080078125, 0.4169921875, 0.75390625, 1.0908203125, 1.427734375, 1.7646484375, 2.1015625, 2.4384765625, 2.775390625, 3.1123046875, 3.44921875, 3.7861328125, 4.123046875, 4.4599609375, 4.796875, 5.1337890625, 5.470703125, 5.8076171875, 6.14453125, 6.4814453125, 6.818359375, 7.1552734375, 7.4921875, 7.8291015625, 8.166015625, 8.5029296875, 8.83984375, 9.1767578125, 9.513671875, 9.8505859375, 10.1875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 10.0, 7.0, 13.0, 8.0, 18.0, 20.0, 24.0, 12.0, 27.0, 23.0, 34.0, 42.0, 49.0, 79.0, 109.0, 149.0, 359.0, 1111.0, 17289.0, 3096045.0, 27944.0, 1233.0, 394.0, 194.0, 111.0, 77.0, 51.0, 49.0, 27.0, 32.0, 24.0, 28.0, 12.0, 20.0, 10.0, 10.0, 8.0, 5.0, 8.0, 8.0, 7.0, 4.0, 2.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-21.890625, -21.149658203125, -20.40869140625, -19.667724609375, -18.9267578125, -18.185791015625, -17.44482421875, -16.703857421875, -15.962890625, -15.221923828125, -14.48095703125, -13.739990234375, -12.9990234375, -12.258056640625, -11.51708984375, -10.776123046875, -10.03515625, -9.294189453125, -8.55322265625, -7.812255859375, -7.0712890625, -6.330322265625, -5.58935546875, -4.848388671875, -4.107421875, -3.366455078125, -2.62548828125, -1.884521484375, -1.1435546875, -0.402587890625, 0.33837890625, 1.079345703125, 1.8203125, 2.561279296875, 3.30224609375, 4.043212890625, 4.7841796875, 5.525146484375, 6.26611328125, 7.007080078125, 7.748046875, 8.489013671875, 9.22998046875, 9.970947265625, 10.7119140625, 11.452880859375, 12.19384765625, 12.934814453125, 13.67578125, 14.416748046875, 15.15771484375, 15.898681640625, 16.6396484375, 17.380615234375, 18.12158203125, 18.862548828125, 19.603515625, 20.344482421875, 21.08544921875, 21.826416015625, 22.5673828125, 23.308349609375, 24.04931640625, 24.790283203125, 25.53125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 12.0, 286.0, 639.0, 77.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.906078338623047, -4.106780052185059, -2.307481288909912, -0.5081825256347656, 1.2911157608032227, 3.090414047241211, 4.889713287353516, 6.689011573791504, 8.488309860229492, 10.28760814666748, 12.086906433105469, 13.886205673217773, 15.685503959655762, 17.48480224609375, 19.284101486206055, 21.08340072631836, 22.88269805908203, 24.681997299194336, 26.481294631958008, 28.280593872070312, 30.079891204833984, 31.87919044494629, 33.678489685058594, 35.477787017822266, 37.27708435058594, 39.07638168334961, 40.87568283081055, 42.67498016357422, 44.47427749633789, 46.27357482910156, 48.0728759765625, 49.87217330932617, 51.671478271484375, 53.47077560424805, 55.270076751708984, 57.069374084472656, 58.86867141723633, 60.66796875, 62.46726989746094, 64.26657104492188, 66.06586456298828, 67.86516571044922, 69.66445922851562, 71.46376037597656, 73.2630615234375, 75.0623550415039, 76.86165618896484, 78.66095733642578, 80.46025085449219, 82.25955200195312, 84.05884552001953, 85.85814666748047, 87.6574478149414, 89.45674133300781, 91.25604248046875, 93.05534362792969, 94.85464477539062, 96.65394592285156, 98.45323944091797, 100.2525405883789, 102.05184173583984, 103.85113525390625, 105.65043640136719, 107.44973754882812, 109.24903106689453]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 9.0, 7.0, 10.0, 15.0, 14.0, 22.0, 24.0, 31.0, 33.0, 39.0, 34.0, 44.0, 25.0, 46.0, 41.0, 35.0, 50.0, 44.0, 45.0, 44.0, 45.0, 45.0, 33.0, 37.0, 31.0, 20.0, 25.0, 19.0, 23.0, 20.0, 23.0, 9.0, 10.0, 8.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.88740921020508, -36.67438507080078, -35.461360931396484, -34.24833679199219, -33.03531265258789, -31.822288513183594, -30.609264373779297, -29.396240234375, -28.183216094970703, -26.970191955566406, -25.75716781616211, -24.544143676757812, -23.331119537353516, -22.11809539794922, -20.905071258544922, -19.692047119140625, -18.479022979736328, -17.26599884033203, -16.052974700927734, -14.839950561523438, -13.62692642211914, -12.413902282714844, -11.200878143310547, -9.98785400390625, -8.774829864501953, -7.561805725097656, -6.348781585693359, -5.1357574462890625, -3.9227333068847656, -2.7097091674804688, -1.4966850280761719, -0.283660888671875, 0.9293594360351562, 2.142383575439453, 3.35540771484375, 4.568431854248047, 5.781455993652344, 6.994480133056641, 8.207504272460938, 9.420528411865234, 10.633552551269531, 11.846576690673828, 13.059600830078125, 14.272624969482422, 15.485649108886719, 16.698673248291016, 17.911697387695312, 19.12472152709961, 20.337745666503906, 21.550769805908203, 22.7637939453125, 23.976818084716797, 25.189842224121094, 26.40286636352539, 27.615890502929688, 28.828914642333984, 30.04193878173828, 31.254962921142578, 32.467987060546875, 33.68101119995117, 34.89403533935547, 36.107059478759766, 37.32008361816406, 38.53310775756836, 39.746131896972656]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 4.0, 8.0, 11.0, 7.0, 11.0, 17.0, 14.0, 16.0, 18.0, 32.0, 30.0, 33.0, 24.0, 45.0, 41.0, 48.0, 38.0, 53.0, 61.0, 53.0, 51.0, 50.0, 50.0, 37.0, 36.0, 37.0, 33.0, 31.0, 15.0, 17.0, 13.0, 16.0, 4.0, 11.0, 8.0, 9.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.5, -4.3792724609375, -4.258544921875, -4.1378173828125, -4.01708984375, -3.8963623046875, -3.775634765625, -3.6549072265625, -3.5341796875, -3.4134521484375, -3.292724609375, -3.1719970703125, -3.05126953125, -2.9305419921875, -2.809814453125, -2.6890869140625, -2.568359375, -2.4476318359375, -2.326904296875, -2.2061767578125, -2.08544921875, -1.9647216796875, -1.843994140625, -1.7232666015625, -1.6025390625, -1.4818115234375, -1.361083984375, -1.2403564453125, -1.11962890625, -0.9989013671875, -0.878173828125, -0.7574462890625, -0.63671875, -0.5159912109375, -0.395263671875, -0.2745361328125, -0.15380859375, -0.0330810546875, 0.087646484375, 0.2083740234375, 0.3291015625, 0.4498291015625, 0.570556640625, 0.6912841796875, 0.81201171875, 0.9327392578125, 1.053466796875, 1.1741943359375, 1.294921875, 1.4156494140625, 1.536376953125, 1.6571044921875, 1.77783203125, 1.8985595703125, 2.019287109375, 2.1400146484375, 2.2607421875, 2.3814697265625, 2.502197265625, 2.6229248046875, 2.74365234375, 2.8643798828125, 2.985107421875, 3.1058349609375, 3.2265625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 1.0, 5.0, 9.0, 11.0, 16.0, 10.0, 13.0, 17.0, 20.0, 35.0, 54.0, 70.0, 94.0, 135.0, 255.0, 438.0, 1143.0, 4768.0, 33193.0, 520498.0, 3229445.0, 371754.0, 26251.0, 3902.0, 1009.0, 466.0, 229.0, 133.0, 87.0, 61.0, 41.0, 29.0, 15.0, 20.0, 18.0, 14.0, 7.0, 5.0, 6.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-15.2734375, -14.8543701171875, -14.435302734375, -14.0162353515625, -13.59716796875, -13.1781005859375, -12.759033203125, -12.3399658203125, -11.9208984375, -11.5018310546875, -11.082763671875, -10.6636962890625, -10.24462890625, -9.8255615234375, -9.406494140625, -8.9874267578125, -8.568359375, -8.1492919921875, -7.730224609375, -7.3111572265625, -6.89208984375, -6.4730224609375, -6.053955078125, -5.6348876953125, -5.2158203125, -4.7967529296875, -4.377685546875, -3.9586181640625, -3.53955078125, -3.1204833984375, -2.701416015625, -2.2823486328125, -1.86328125, -1.4442138671875, -1.025146484375, -0.6060791015625, -0.18701171875, 0.2320556640625, 0.651123046875, 1.0701904296875, 1.4892578125, 1.9083251953125, 2.327392578125, 2.7464599609375, 3.16552734375, 3.5845947265625, 4.003662109375, 4.4227294921875, 4.841796875, 5.2608642578125, 5.679931640625, 6.0989990234375, 6.51806640625, 6.9371337890625, 7.356201171875, 7.7752685546875, 8.1943359375, 8.6134033203125, 9.032470703125, 9.4515380859375, 9.87060546875, 10.2896728515625, 10.708740234375, 11.1278076171875, 11.546875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 4.0, 7.0, 19.0, 20.0, 35.0, 39.0, 83.0, 124.0, 179.0, 270.0, 474.0, 672.0, 685.0, 511.0, 330.0, 219.0, 139.0, 88.0, 76.0, 39.0, 20.0, 20.0, 12.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.78125, -18.231201171875, -17.68115234375, -17.131103515625, -16.5810546875, -16.031005859375, -15.48095703125, -14.930908203125, -14.380859375, -13.830810546875, -13.28076171875, -12.730712890625, -12.1806640625, -11.630615234375, -11.08056640625, -10.530517578125, -9.98046875, -9.430419921875, -8.88037109375, -8.330322265625, -7.7802734375, -7.230224609375, -6.68017578125, -6.130126953125, -5.580078125, -5.030029296875, -4.47998046875, -3.929931640625, -3.3798828125, -2.829833984375, -2.27978515625, -1.729736328125, -1.1796875, -0.629638671875, -0.07958984375, 0.470458984375, 1.0205078125, 1.570556640625, 2.12060546875, 2.670654296875, 3.220703125, 3.770751953125, 4.32080078125, 4.870849609375, 5.4208984375, 5.970947265625, 6.52099609375, 7.071044921875, 7.62109375, 8.171142578125, 8.72119140625, 9.271240234375, 9.8212890625, 10.371337890625, 10.92138671875, 11.471435546875, 12.021484375, 12.571533203125, 13.12158203125, 13.671630859375, 14.2216796875, 14.771728515625, 15.32177734375, 15.871826171875, 16.421875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 11.0, 15.0, 18.0, 31.0, 38.0, 63.0, 100.0, 157.0, 279.0, 422.0, 982.0, 4997.0, 154571.0, 3914460.0, 111998.0, 4081.0, 984.0, 412.0, 219.0, 138.0, 98.0, 64.0, 43.0, 24.0, 24.0, 12.0, 10.0, 5.0, 11.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.53125, -27.26123046875, -25.9912109375, -24.72119140625, -23.451171875, -22.18115234375, -20.9111328125, -19.64111328125, -18.37109375, -17.10107421875, -15.8310546875, -14.56103515625, -13.291015625, -12.02099609375, -10.7509765625, -9.48095703125, -8.2109375, -6.94091796875, -5.6708984375, -4.40087890625, -3.130859375, -1.86083984375, -0.5908203125, 0.67919921875, 1.94921875, 3.21923828125, 4.4892578125, 5.75927734375, 7.029296875, 8.29931640625, 9.5693359375, 10.83935546875, 12.109375, 13.37939453125, 14.6494140625, 15.91943359375, 17.189453125, 18.45947265625, 19.7294921875, 20.99951171875, 22.26953125, 23.53955078125, 24.8095703125, 26.07958984375, 27.349609375, 28.61962890625, 29.8896484375, 31.15966796875, 32.4296875, 33.69970703125, 34.9697265625, 36.23974609375, 37.509765625, 38.77978515625, 40.0498046875, 41.31982421875, 42.58984375, 43.85986328125, 45.1298828125, 46.39990234375, 47.669921875, 48.93994140625, 50.2099609375, 51.47998046875, 52.75]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 78.0, 507.0, 393.0, 35.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-412.53875732421875, -405.15386962890625, -397.7689514160156, -390.3840637207031, -382.9991760253906, -375.6142578125, -368.2293701171875, -360.844482421875, -353.4595947265625, -346.07470703125, -338.6897888183594, -331.3049011230469, -323.9200134277344, -316.53509521484375, -309.15020751953125, -301.76531982421875, -294.3804016113281, -286.9955139160156, -279.610595703125, -272.2257080078125, -264.8408203125, -257.4559326171875, -250.07101440429688, -242.68612670898438, -235.30123901367188, -227.9163360595703, -220.5314483642578, -213.14654541015625, -205.76165771484375, -198.3767547607422, -190.99185180664062, -183.60696411132812, -176.22206115722656, -168.837158203125, -161.4522705078125, -154.06736755371094, -146.68247985839844, -139.29757690429688, -131.91268920898438, -124.52778625488281, -117.14288330078125, -109.75798797607422, -102.37309265136719, -94.98818969726562, -87.6032943725586, -80.21839904785156, -72.83350372314453, -65.4486083984375, -58.0637092590332, -50.67881393432617, -43.293914794921875, -35.909019470214844, -28.52412223815918, -21.139225006103516, -13.754329681396484, -6.3694305419921875, 1.0154647827148438, 8.400362014770508, 15.785258293151855, 23.170154571533203, 30.555051803588867, 37.93994903564453, 45.32484436035156, 52.70974349975586, 60.09463882446289]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 7.0, 9.0, 9.0, 8.0, 12.0, 10.0, 21.0, 19.0, 21.0, 21.0, 25.0, 29.0, 21.0, 32.0, 23.0, 30.0, 26.0, 32.0, 34.0, 30.0, 38.0, 40.0, 45.0, 22.0, 43.0, 25.0, 26.0, 39.0, 34.0, 36.0, 27.0, 23.0, 19.0, 20.0, 18.0, 25.0, 20.0, 10.0, 11.0, 12.0, 15.0, 9.0, 5.0, 10.0, 6.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-36.43756103515625, -35.34339904785156, -34.249237060546875, -33.15507507324219, -32.0609130859375, -30.96674919128418, -29.87258529663086, -28.778423309326172, -27.684261322021484, -26.590099334716797, -25.49593734741211, -24.40177345275879, -23.3076114654541, -22.213449478149414, -21.119285583496094, -20.025123596191406, -18.93096160888672, -17.83679962158203, -16.742637634277344, -15.648473739624023, -14.554311752319336, -13.460149765014648, -12.365986824035645, -11.27182388305664, -10.177661895751953, -9.083499908447266, -7.989336967468262, -6.895174503326416, -5.80101203918457, -4.706849575042725, -3.612687110900879, -2.518524646759033, -1.4243621826171875, -0.3301997184753418, 0.7639627456665039, 1.8581252098083496, 2.9522876739501953, 4.046450138092041, 5.140612602233887, 6.234775066375732, 7.328937530517578, 8.423099517822266, 9.51726245880127, 10.611425399780273, 11.705587387084961, 12.799749374389648, 13.893912315368652, 14.988075256347656, 16.082237243652344, 17.17639923095703, 18.27056121826172, 19.36472511291504, 20.458887100219727, 21.553049087524414, 22.647212982177734, 23.741374969482422, 24.83553695678711, 25.929698944091797, 27.023860931396484, 28.118024826049805, 29.212186813354492, 30.30634880065918, 31.4005126953125, 32.49467468261719, 33.588836669921875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 7.0, 6.0, 6.0, 15.0, 15.0, 10.0, 22.0, 25.0, 17.0, 36.0, 39.0, 36.0, 26.0, 42.0, 44.0, 50.0, 46.0, 54.0, 47.0, 55.0, 52.0, 44.0, 60.0, 34.0, 35.0, 22.0, 29.0, 21.0, 23.0, 13.0, 14.0, 12.0, 5.0, 7.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1640625, -4.0396728515625, -3.915283203125, -3.7908935546875, -3.66650390625, -3.5421142578125, -3.417724609375, -3.2933349609375, -3.1689453125, -3.0445556640625, -2.920166015625, -2.7957763671875, -2.67138671875, -2.5469970703125, -2.422607421875, -2.2982177734375, -2.173828125, -2.0494384765625, -1.925048828125, -1.8006591796875, -1.67626953125, -1.5518798828125, -1.427490234375, -1.3031005859375, -1.1787109375, -1.0543212890625, -0.929931640625, -0.8055419921875, -0.68115234375, -0.5567626953125, -0.432373046875, -0.3079833984375, -0.18359375, -0.0592041015625, 0.065185546875, 0.1895751953125, 0.31396484375, 0.4383544921875, 0.562744140625, 0.6871337890625, 0.8115234375, 0.9359130859375, 1.060302734375, 1.1846923828125, 1.30908203125, 1.4334716796875, 1.557861328125, 1.6822509765625, 1.806640625, 1.9310302734375, 2.055419921875, 2.1798095703125, 2.30419921875, 2.4285888671875, 2.552978515625, 2.6773681640625, 2.8017578125, 2.9261474609375, 3.050537109375, 3.1749267578125, 3.29931640625, 3.4237060546875, 3.548095703125, 3.6724853515625, 3.796875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 11.0, 14.0, 30.0, 34.0, 63.0, 97.0, 141.0, 241.0, 382.0, 612.0, 990.0, 1695.0, 3017.0, 5315.0, 9535.0, 17028.0, 30665.0, 56246.0, 111574.0, 234081.0, 281938.0, 141184.0, 69616.0, 36973.0, 20440.0, 11320.0, 6560.0, 3609.0, 2145.0, 1162.0, 664.0, 464.0, 251.0, 163.0, 94.0, 56.0, 45.0, 36.0, 22.0, 14.0, 10.0, 6.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.68408203125, -0.6634521484375, -0.642822265625, -0.6221923828125, -0.6015625, -0.5809326171875, -0.560302734375, -0.5396728515625, -0.51904296875, -0.4984130859375, -0.477783203125, -0.4571533203125, -0.4365234375, -0.4158935546875, -0.395263671875, -0.3746337890625, -0.35400390625, -0.3333740234375, -0.312744140625, -0.2921142578125, -0.271484375, -0.2508544921875, -0.230224609375, -0.2095947265625, -0.18896484375, -0.1683349609375, -0.147705078125, -0.1270751953125, -0.1064453125, -0.0858154296875, -0.065185546875, -0.0445556640625, -0.02392578125, -0.0032958984375, 0.017333984375, 0.0379638671875, 0.05859375, 0.0792236328125, 0.099853515625, 0.1204833984375, 0.14111328125, 0.1617431640625, 0.182373046875, 0.2030029296875, 0.2236328125, 0.2442626953125, 0.264892578125, 0.2855224609375, 0.30615234375, 0.3267822265625, 0.347412109375, 0.3680419921875, 0.388671875, 0.4093017578125, 0.429931640625, 0.4505615234375, 0.47119140625, 0.4918212890625, 0.512451171875, 0.5330810546875, 0.5537109375, 0.5743408203125, 0.594970703125, 0.6156005859375, 0.63623046875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 9.0, 11.0, 9.0, 14.0, 18.0, 15.0, 17.0, 22.0, 19.0, 25.0, 39.0, 42.0, 35.0, 41.0, 31.0, 41.0, 33.0, 31.0, 1063.0, 39.0, 41.0, 45.0, 35.0, 40.0, 41.0, 27.0, 32.0, 24.0, 30.0, 17.0, 19.0, 15.0, 17.0, 18.0, 12.0, 10.0, 13.0, 10.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.140625, -2.070465087890625, -2.00030517578125, -1.930145263671875, -1.8599853515625, -1.789825439453125, -1.71966552734375, -1.649505615234375, -1.579345703125, -1.509185791015625, -1.43902587890625, -1.368865966796875, -1.2987060546875, -1.228546142578125, -1.15838623046875, -1.088226318359375, -1.01806640625, -0.947906494140625, -0.87774658203125, -0.807586669921875, -0.7374267578125, -0.667266845703125, -0.59710693359375, -0.526947021484375, -0.456787109375, -0.386627197265625, -0.31646728515625, -0.246307373046875, -0.1761474609375, -0.105987548828125, -0.03582763671875, 0.034332275390625, 0.1044921875, 0.174652099609375, 0.24481201171875, 0.314971923828125, 0.3851318359375, 0.455291748046875, 0.52545166015625, 0.595611572265625, 0.665771484375, 0.735931396484375, 0.80609130859375, 0.876251220703125, 0.9464111328125, 1.016571044921875, 1.08673095703125, 1.156890869140625, 1.22705078125, 1.297210693359375, 1.36737060546875, 1.437530517578125, 1.5076904296875, 1.577850341796875, 1.64801025390625, 1.718170166015625, 1.788330078125, 1.858489990234375, 1.92864990234375, 1.998809814453125, 2.0689697265625, 2.139129638671875, 2.20928955078125, 2.279449462890625, 2.349609375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 5.0, 5.0, 10.0, 22.0, 18.0, 41.0, 60.0, 101.0, 125.0, 209.0, 337.0, 533.0, 921.0, 1533.0, 2631.0, 4345.0, 7707.0, 13837.0, 24416.0, 45091.0, 85555.0, 166151.0, 1307196.0, 203635.0, 107578.0, 55908.0, 29741.0, 16629.0, 9448.0, 5511.0, 3094.0, 1856.0, 1139.0, 646.0, 405.0, 255.0, 151.0, 95.0, 68.0, 43.0, 21.0, 22.0, 16.0, 9.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.462890625, -0.4491424560546875, -0.435394287109375, -0.4216461181640625, -0.40789794921875, -0.3941497802734375, -0.380401611328125, -0.3666534423828125, -0.3529052734375, -0.3391571044921875, -0.325408935546875, -0.3116607666015625, -0.29791259765625, -0.2841644287109375, -0.270416259765625, -0.2566680908203125, -0.242919921875, -0.2291717529296875, -0.215423583984375, -0.2016754150390625, -0.18792724609375, -0.1741790771484375, -0.160430908203125, -0.1466827392578125, -0.1329345703125, -0.1191864013671875, -0.105438232421875, -0.0916900634765625, -0.07794189453125, -0.0641937255859375, -0.050445556640625, -0.0366973876953125, -0.02294921875, -0.0092010498046875, 0.004547119140625, 0.0182952880859375, 0.03204345703125, 0.0457916259765625, 0.059539794921875, 0.0732879638671875, 0.0870361328125, 0.1007843017578125, 0.114532470703125, 0.1282806396484375, 0.14202880859375, 0.1557769775390625, 0.169525146484375, 0.1832733154296875, 0.197021484375, 0.2107696533203125, 0.224517822265625, 0.2382659912109375, 0.25201416015625, 0.2657623291015625, 0.279510498046875, 0.2932586669921875, 0.3070068359375, 0.3207550048828125, 0.334503173828125, 0.3482513427734375, 0.36199951171875, 0.3757476806640625, 0.389495849609375, 0.4032440185546875, 0.4169921875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 14.0, 10.0, 17.0, 13.0, 24.0, 20.0, 42.0, 35.0, 49.0, 58.0, 101.0, 94.0, 98.0, 93.0, 76.0, 62.0, 41.0, 21.0, 22.0, 19.0, 18.0, 11.0, 8.0, 12.0, 3.0, 5.0, 4.0, 8.0, 0.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0033397674560546875, -0.0032536983489990234, -0.0031676292419433594, -0.0030815601348876953, -0.0029954910278320312, -0.002909421920776367, -0.002823352813720703, -0.002737283706665039, -0.002651214599609375, -0.002565145492553711, -0.002479076385498047, -0.002393007278442383, -0.0023069381713867188, -0.0022208690643310547, -0.0021347999572753906, -0.0020487308502197266, -0.0019626617431640625, -0.0018765926361083984, -0.0017905235290527344, -0.0017044544219970703, -0.0016183853149414062, -0.0015323162078857422, -0.0014462471008300781, -0.001360177993774414, -0.00127410888671875, -0.001188039779663086, -0.0011019706726074219, -0.0010159015655517578, -0.0009298324584960938, -0.0008437633514404297, -0.0007576942443847656, -0.0006716251373291016, -0.0005855560302734375, -0.0004994869232177734, -0.0004134178161621094, -0.0003273487091064453, -0.00024127960205078125, -0.0001552104949951172, -6.914138793945312e-05, 1.6927719116210938e-05, 0.000102996826171875, 0.00018906593322753906, 0.0002751350402832031, 0.0003612041473388672, 0.00044727325439453125, 0.0005333423614501953, 0.0006194114685058594, 0.0007054805755615234, 0.0007915496826171875, 0.0008776187896728516, 0.0009636878967285156, 0.0010497570037841797, 0.0011358261108398438, 0.0012218952178955078, 0.0013079643249511719, 0.001394033432006836, 0.0014801025390625, 0.001566171646118164, 0.0016522407531738281, 0.0017383098602294922, 0.0018243789672851562, 0.0019104480743408203, 0.0019965171813964844, 0.0020825862884521484, 0.0021686553955078125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 9.0, 11.0, 9.0, 20.0, 15.0, 21.0, 27.0, 35.0, 67.0, 104.0, 215.0, 367.0, 1204.0, 1042886.0, 2535.0, 474.0, 175.0, 102.0, 67.0, 46.0, 30.0, 28.0, 13.0, 15.0, 18.0, 10.0, 8.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05743408203125, -0.05527687072753906, -0.053119659423828125, -0.05096244812011719, -0.04880523681640625, -0.04664802551269531, -0.044490814208984375, -0.04233360290527344, -0.0401763916015625, -0.03801918029785156, -0.035861968994140625, -0.03370475769042969, -0.03154754638671875, -0.029390335083007812, -0.027233123779296875, -0.025075912475585938, -0.022918701171875, -0.020761489868164062, -0.018604278564453125, -0.016447067260742188, -0.01428985595703125, -0.012132644653320312, -0.009975433349609375, -0.007818222045898438, -0.0056610107421875, -0.0035037994384765625, -0.001346588134765625, 0.0008106231689453125, 0.00296783447265625, 0.0051250457763671875, 0.007282257080078125, 0.009439468383789062, 0.0115966796875, 0.013753890991210938, 0.015911102294921875, 0.018068313598632812, 0.02022552490234375, 0.022382736206054688, 0.024539947509765625, 0.026697158813476562, 0.0288543701171875, 0.031011581420898438, 0.033168792724609375, 0.03532600402832031, 0.03748321533203125, 0.03964042663574219, 0.041797637939453125, 0.04395484924316406, 0.046112060546875, 0.04826927185058594, 0.050426483154296875, 0.05258369445800781, 0.05474090576171875, 0.05689811706542969, 0.059055328369140625, 0.06121253967285156, 0.0633697509765625, 0.06552696228027344, 0.06768417358398438, 0.06984138488769531, 0.07199859619140625, 0.07415580749511719, 0.07631301879882812, 0.07847023010253906, 0.08062744140625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1018.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006074903532862663, -0.0038381684571504593, -0.0016014333814382553, 0.0006353016942739487, 0.0028720367699861526, 0.005108771845698357, 0.007345506921410561, 0.009582241997122765, 0.011818977072834969, 0.014055712148547173, 0.016292447224259377, 0.01852918229997158, 0.020765917375683784, 0.02300265245139599, 0.025239387527108192, 0.027476122602820396, 0.0297128576785326, 0.031949594616889954, 0.03418632596731186, 0.03642306476831436, 0.03865979611873627, 0.04089653491973877, 0.043133266270160675, 0.04537000507116318, 0.04760673642158508, 0.04984347149729729, 0.05208020657300949, 0.054316941648721695, 0.0565536767244339, 0.0587904118001461, 0.06102714687585831, 0.06326387822628021, 0.06550061702728271, 0.06773735582828522, 0.06997408717870712, 0.07221081852912903, 0.07444755733013153, 0.07668429613113403, 0.07892102748155594, 0.08115775883197784, 0.08339449763298035, 0.08563123643398285, 0.08786796778440475, 0.09010469913482666, 0.09234143793582916, 0.09457817673683167, 0.09681490808725357, 0.09905163943767548, 0.10128837823867798, 0.10352511703968048, 0.10576184839010239, 0.10799857974052429, 0.1102353185415268, 0.1124720573425293, 0.1147087886929512, 0.11694552004337311, 0.11918225884437561, 0.12141899764537811, 0.12365572899580002, 0.12589246034622192, 0.12812919914722443, 0.13036593794822693, 0.13260266184806824, 0.13483940064907074, 0.13707613945007324]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 18.0, 24.0, 39.0, 46.0, 55.0, 53.0, 75.0, 91.0, 92.0, 85.0, 77.0, 86.0, 82.0, 57.0, 41.0, 39.0, 18.0, 13.0, 7.0, 6.0, 2.0, 2.0], "bins": [-0.0042359232902526855, -0.0041525838896632195, -0.004069244489073753, -0.003985905088484287, -0.003902565687894821, -0.003819226287305355, -0.003735886886715889, -0.003652547486126423, -0.003569208085536957, -0.0034858686849474907, -0.0034025292843580246, -0.0033191898837685585, -0.0032358504831790924, -0.0031525110825896263, -0.0030691716820001602, -0.002985832281410694, -0.002902492880821228, -0.002819153480231762, -0.002735814079642296, -0.0026524746790528297, -0.0025691352784633636, -0.0024857958778738976, -0.0024024564772844315, -0.0023191170766949654, -0.0022357776761054993, -0.002152438275516033, -0.002069098874926567, -0.001985759474337101, -0.0019024200737476349, -0.0018190806731581688, -0.0017357412725687027, -0.0016524018719792366, -0.0015690624713897705, -0.0014857230708003044, -0.0014023836702108383, -0.0013190442696213722, -0.0012357048690319061, -0.00115236546844244, -0.001069026067852974, -0.0009856866672635078, -0.0009023472666740417, -0.0008190078660845757, -0.0007356684654951096, -0.0006523290649056435, -0.0005689896643161774, -0.0004856502637267113, -0.0004023108631372452, -0.0003189714625477791, -0.000235632061958313, -0.0001522926613688469, -6.89532607793808e-05, 1.4386139810085297e-05, 9.772554039955139e-05, 0.0001810649409890175, 0.0002644043415784836, 0.0003477437421679497, 0.00043108314275741577, 0.0005144225433468819, 0.000597761943936348, 0.0006811013445258141, 0.0007644407451152802, 0.0008477801457047462, 0.0009311195462942123, 0.0010144589468836784, 0.0010977983474731445]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 7.0, 6.0, 6.0, 15.0, 15.0, 10.0, 22.0, 25.0, 17.0, 36.0, 39.0, 36.0, 26.0, 42.0, 44.0, 50.0, 46.0, 54.0, 47.0, 55.0, 52.0, 44.0, 60.0, 34.0, 35.0, 22.0, 29.0, 21.0, 23.0, 13.0, 14.0, 12.0, 5.0, 7.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1640625, -4.0396728515625, -3.915283203125, -3.7908935546875, -3.66650390625, -3.5421142578125, -3.417724609375, -3.2933349609375, -3.1689453125, -3.0445556640625, -2.920166015625, -2.7957763671875, -2.67138671875, -2.5469970703125, -2.422607421875, -2.2982177734375, -2.173828125, -2.0494384765625, -1.925048828125, -1.8006591796875, -1.67626953125, -1.5518798828125, -1.427490234375, -1.3031005859375, -1.1787109375, -1.0543212890625, -0.929931640625, -0.8055419921875, -0.68115234375, -0.5567626953125, -0.432373046875, -0.3079833984375, -0.18359375, -0.0592041015625, 0.065185546875, 0.1895751953125, 0.31396484375, 0.4383544921875, 0.562744140625, 0.6871337890625, 0.8115234375, 0.9359130859375, 1.060302734375, 1.1846923828125, 1.30908203125, 1.4334716796875, 1.557861328125, 1.6822509765625, 1.806640625, 1.9310302734375, 2.055419921875, 2.1798095703125, 2.30419921875, 2.4285888671875, 2.552978515625, 2.6773681640625, 2.8017578125, 2.9261474609375, 3.050537109375, 3.1749267578125, 3.29931640625, 3.4237060546875, 3.548095703125, 3.6724853515625, 3.796875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 12.0, 11.0, 11.0, 28.0, 33.0, 42.0, 60.0, 86.0, 133.0, 215.0, 288.0, 488.0, 705.0, 1101.0, 1927.0, 3386.0, 6268.0, 12189.0, 25005.0, 59744.0, 172050.0, 439991.0, 199976.0, 67673.0, 27935.0, 13191.0, 6851.0, 3643.0, 2068.0, 1201.0, 792.0, 476.0, 313.0, 194.0, 147.0, 78.0, 76.0, 58.0, 32.0, 25.0, 16.0, 12.0, 1.0, 3.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.830078125, -2.74041748046875, -2.6507568359375, -2.56109619140625, -2.471435546875, -2.38177490234375, -2.2921142578125, -2.20245361328125, -2.11279296875, -2.02313232421875, -1.9334716796875, -1.84381103515625, -1.754150390625, -1.66448974609375, -1.5748291015625, -1.48516845703125, -1.3955078125, -1.30584716796875, -1.2161865234375, -1.12652587890625, -1.036865234375, -0.94720458984375, -0.8575439453125, -0.76788330078125, -0.67822265625, -0.58856201171875, -0.4989013671875, -0.40924072265625, -0.319580078125, -0.22991943359375, -0.1402587890625, -0.05059814453125, 0.0390625, 0.12872314453125, 0.2183837890625, 0.30804443359375, 0.397705078125, 0.48736572265625, 0.5770263671875, 0.66668701171875, 0.75634765625, 0.84600830078125, 0.9356689453125, 1.02532958984375, 1.114990234375, 1.20465087890625, 1.2943115234375, 1.38397216796875, 1.4736328125, 1.56329345703125, 1.6529541015625, 1.74261474609375, 1.832275390625, 1.92193603515625, 2.0115966796875, 2.10125732421875, 2.19091796875, 2.28057861328125, 2.3702392578125, 2.45989990234375, 2.549560546875, 2.63922119140625, 2.7288818359375, 2.81854248046875, 2.908203125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 5.0, 2.0, 10.0, 6.0, 17.0, 6.0, 7.0, 13.0, 24.0, 24.0, 22.0, 25.0, 36.0, 33.0, 34.0, 43.0, 47.0, 61.0, 64.0, 137.0, 1769.0, 167.0, 68.0, 59.0, 44.0, 43.0, 46.0, 40.0, 31.0, 25.0, 25.0, 25.0, 20.0, 23.0, 12.0, 6.0, 9.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.9193115234375, -11.502685546875, -11.0860595703125, -10.66943359375, -10.2528076171875, -9.836181640625, -9.4195556640625, -9.0029296875, -8.5863037109375, -8.169677734375, -7.7530517578125, -7.33642578125, -6.9197998046875, -6.503173828125, -6.0865478515625, -5.669921875, -5.2532958984375, -4.836669921875, -4.4200439453125, -4.00341796875, -3.5867919921875, -3.170166015625, -2.7535400390625, -2.3369140625, -1.9202880859375, -1.503662109375, -1.0870361328125, -0.67041015625, -0.2537841796875, 0.162841796875, 0.5794677734375, 0.99609375, 1.4127197265625, 1.829345703125, 2.2459716796875, 2.66259765625, 3.0792236328125, 3.495849609375, 3.9124755859375, 4.3291015625, 4.7457275390625, 5.162353515625, 5.5789794921875, 5.99560546875, 6.4122314453125, 6.828857421875, 7.2454833984375, 7.662109375, 8.0787353515625, 8.495361328125, 8.9119873046875, 9.32861328125, 9.7452392578125, 10.161865234375, 10.5784912109375, 10.9951171875, 11.4117431640625, 11.828369140625, 12.2449951171875, 12.66162109375, 13.0782470703125, 13.494873046875, 13.9114990234375, 14.328125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 7.0, 8.0, 5.0, 7.0, 9.0, 14.0, 24.0, 29.0, 40.0, 32.0, 41.0, 60.0, 78.0, 94.0, 199.0, 380.0, 1075.0, 7280.0, 840275.0, 2284413.0, 9270.0, 1228.0, 424.0, 197.0, 118.0, 91.0, 62.0, 47.0, 41.0, 33.0, 21.0, 22.0, 13.0, 13.0, 12.0, 13.0, 7.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-24.28125, -23.58837890625, -22.8955078125, -22.20263671875, -21.509765625, -20.81689453125, -20.1240234375, -19.43115234375, -18.73828125, -18.04541015625, -17.3525390625, -16.65966796875, -15.966796875, -15.27392578125, -14.5810546875, -13.88818359375, -13.1953125, -12.50244140625, -11.8095703125, -11.11669921875, -10.423828125, -9.73095703125, -9.0380859375, -8.34521484375, -7.65234375, -6.95947265625, -6.2666015625, -5.57373046875, -4.880859375, -4.18798828125, -3.4951171875, -2.80224609375, -2.109375, -1.41650390625, -0.7236328125, -0.03076171875, 0.662109375, 1.35498046875, 2.0478515625, 2.74072265625, 3.43359375, 4.12646484375, 4.8193359375, 5.51220703125, 6.205078125, 6.89794921875, 7.5908203125, 8.28369140625, 8.9765625, 9.66943359375, 10.3623046875, 11.05517578125, 11.748046875, 12.44091796875, 13.1337890625, 13.82666015625, 14.51953125, 15.21240234375, 15.9052734375, 16.59814453125, 17.291015625, 17.98388671875, 18.6767578125, 19.36962890625, 20.0625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 12.0, 37.0, 132.0, 280.0, 288.0, 177.0, 58.0, 23.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.660255432128906, -35.67465591430664, -34.68905258178711, -33.703453063964844, -32.71785354614258, -31.73225212097168, -30.74665069580078, -29.761051177978516, -28.775449752807617, -27.78984832763672, -26.804248809814453, -25.818647384643555, -24.833045959472656, -23.84744644165039, -22.861845016479492, -21.876243591308594, -20.890644073486328, -19.90504264831543, -18.919443130493164, -17.933841705322266, -16.948240280151367, -15.962640762329102, -14.977039337158203, -13.991438865661621, -13.005836486816406, -12.020236015319824, -11.034634590148926, -10.049034118652344, -9.063433647155762, -8.07783317565918, -7.092231750488281, -6.106631278991699, -5.121030807495117, -4.135429859161377, -3.149829387664795, -2.1642284393310547, -1.1786277294158936, -0.19302701950073242, 0.7925739288330078, 1.7781744003295898, 2.76377534866333, 3.749376058578491, 4.734976768493652, 5.720577716827393, 6.706178665161133, 7.691779136657715, 8.677379608154297, 9.662981033325195, 10.648581504821777, 11.63418197631836, 12.619783401489258, 13.60538387298584, 14.590984344482422, 15.57658576965332, 16.56218719482422, 17.547786712646484, 18.533388137817383, 19.51898956298828, 20.504589080810547, 21.490190505981445, 22.475791931152344, 23.46139144897461, 24.446992874145508, 25.432594299316406, 26.418193817138672]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 3.0, 4.0, 7.0, 11.0, 17.0, 14.0, 18.0, 28.0, 38.0, 42.0, 36.0, 39.0, 46.0, 52.0, 47.0, 51.0, 49.0, 40.0, 44.0, 41.0, 39.0, 36.0, 41.0, 32.0, 33.0, 22.0, 24.0, 30.0, 17.0, 24.0, 8.0, 12.0, 9.0, 10.0, 11.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.41718673706055, -43.99454879760742, -42.5719108581543, -41.14927291870117, -39.72663116455078, -38.303993225097656, -36.88135528564453, -35.458717346191406, -34.03607940673828, -32.613441467285156, -31.19080352783203, -29.768163681030273, -28.34552574157715, -26.922887802124023, -25.500247955322266, -24.07761001586914, -22.654972076416016, -21.23233413696289, -19.809696197509766, -18.387056350708008, -16.964418411254883, -15.541780471801758, -14.119141578674316, -12.696502685546875, -11.27386474609375, -9.851226806640625, -8.428587913513184, -7.0059494972229, -5.583311080932617, -4.160672664642334, -2.738034248352051, -1.3153953552246094, 0.10724639892578125, 1.5298848152160645, 2.9525232315063477, 4.375161647796631, 5.797800064086914, 7.220438480377197, 8.64307689666748, 10.065715789794922, 11.488353729248047, 12.910991668701172, 14.333630561828613, 15.756269454956055, 17.17890739440918, 18.601545333862305, 20.024185180664062, 21.446823120117188, 22.869461059570312, 24.292098999023438, 25.714736938476562, 27.13737678527832, 28.560014724731445, 29.98265266418457, 31.405292510986328, 32.82793045043945, 34.25056838989258, 35.6732063293457, 37.09584426879883, 38.51848220825195, 39.941123962402344, 41.36376190185547, 42.786399841308594, 44.20903778076172, 45.631675720214844]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 2.0, 8.0, 4.0, 6.0, 6.0, 10.0, 10.0, 11.0, 20.0, 20.0, 20.0, 19.0, 32.0, 35.0, 35.0, 31.0, 41.0, 45.0, 52.0, 44.0, 58.0, 45.0, 55.0, 61.0, 40.0, 42.0, 49.0, 37.0, 22.0, 26.0, 20.0, 20.0, 14.0, 24.0, 7.0, 7.0, 5.0, 7.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.0550537109375, -3.926513671875, -3.7979736328125, -3.66943359375, -3.5408935546875, -3.412353515625, -3.2838134765625, -3.1552734375, -3.0267333984375, -2.898193359375, -2.7696533203125, -2.64111328125, -2.5125732421875, -2.384033203125, -2.2554931640625, -2.126953125, -1.9984130859375, -1.869873046875, -1.7413330078125, -1.61279296875, -1.4842529296875, -1.355712890625, -1.2271728515625, -1.0986328125, -0.9700927734375, -0.841552734375, -0.7130126953125, -0.58447265625, -0.4559326171875, -0.327392578125, -0.1988525390625, -0.0703125, 0.0582275390625, 0.186767578125, 0.3153076171875, 0.44384765625, 0.5723876953125, 0.700927734375, 0.8294677734375, 0.9580078125, 1.0865478515625, 1.215087890625, 1.3436279296875, 1.47216796875, 1.6007080078125, 1.729248046875, 1.8577880859375, 1.986328125, 2.1148681640625, 2.243408203125, 2.3719482421875, 2.50048828125, 2.6290283203125, 2.757568359375, 2.8861083984375, 3.0146484375, 3.1431884765625, 3.271728515625, 3.4002685546875, 3.52880859375, 3.6573486328125, 3.785888671875, 3.9144287109375, 4.04296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 5.0, 6.0, 6.0, 9.0, 14.0, 16.0, 19.0, 20.0, 14.0, 31.0, 27.0, 23.0, 28.0, 43.0, 54.0, 162.0, 665.0, 4494.0, 87891.0, 3497458.0, 587731.0, 13508.0, 1348.0, 298.0, 102.0, 46.0, 46.0, 22.0, 21.0, 27.0, 27.0, 20.0, 21.0, 13.0, 11.0, 11.0, 10.0, 7.0, 9.0, 1.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.359375, -17.719970703125, -17.08056640625, -16.441162109375, -15.8017578125, -15.162353515625, -14.52294921875, -13.883544921875, -13.244140625, -12.604736328125, -11.96533203125, -11.325927734375, -10.6865234375, -10.047119140625, -9.40771484375, -8.768310546875, -8.12890625, -7.489501953125, -6.85009765625, -6.210693359375, -5.5712890625, -4.931884765625, -4.29248046875, -3.653076171875, -3.013671875, -2.374267578125, -1.73486328125, -1.095458984375, -0.4560546875, 0.183349609375, 0.82275390625, 1.462158203125, 2.1015625, 2.740966796875, 3.38037109375, 4.019775390625, 4.6591796875, 5.298583984375, 5.93798828125, 6.577392578125, 7.216796875, 7.856201171875, 8.49560546875, 9.135009765625, 9.7744140625, 10.413818359375, 11.05322265625, 11.692626953125, 12.33203125, 12.971435546875, 13.61083984375, 14.250244140625, 14.8896484375, 15.529052734375, 16.16845703125, 16.807861328125, 17.447265625, 18.086669921875, 18.72607421875, 19.365478515625, 20.0048828125, 20.644287109375, 21.28369140625, 21.923095703125, 22.5625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 7.0, 11.0, 15.0, 15.0, 25.0, 39.0, 37.0, 70.0, 99.0, 163.0, 211.0, 302.0, 452.0, 590.0, 595.0, 467.0, 306.0, 216.0, 138.0, 103.0, 75.0, 46.0, 28.0, 23.0, 13.0, 9.0, 9.0, 5.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-18.890625, -18.4508056640625, -18.010986328125, -17.5711669921875, -17.13134765625, -16.6915283203125, -16.251708984375, -15.8118896484375, -15.3720703125, -14.9322509765625, -14.492431640625, -14.0526123046875, -13.61279296875, -13.1729736328125, -12.733154296875, -12.2933349609375, -11.853515625, -11.4136962890625, -10.973876953125, -10.5340576171875, -10.09423828125, -9.6544189453125, -9.214599609375, -8.7747802734375, -8.3349609375, -7.8951416015625, -7.455322265625, -7.0155029296875, -6.57568359375, -6.1358642578125, -5.696044921875, -5.2562255859375, -4.81640625, -4.3765869140625, -3.936767578125, -3.4969482421875, -3.05712890625, -2.6173095703125, -2.177490234375, -1.7376708984375, -1.2978515625, -0.8580322265625, -0.418212890625, 0.0216064453125, 0.46142578125, 0.9012451171875, 1.341064453125, 1.7808837890625, 2.220703125, 2.6605224609375, 3.100341796875, 3.5401611328125, 3.97998046875, 4.4197998046875, 4.859619140625, 5.2994384765625, 5.7392578125, 6.1790771484375, 6.618896484375, 7.0587158203125, 7.49853515625, 7.9383544921875, 8.378173828125, 8.8179931640625, 9.2578125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 18.0, 26.0, 44.0, 59.0, 105.0, 175.0, 312.0, 570.0, 2230.0, 105036.0, 4047379.0, 35649.0, 1552.0, 472.0, 259.0, 134.0, 105.0, 58.0, 34.0, 12.0, 13.0, 12.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.71875, -37.94580078125, -36.1728515625, -34.39990234375, -32.626953125, -30.85400390625, -29.0810546875, -27.30810546875, -25.53515625, -23.76220703125, -21.9892578125, -20.21630859375, -18.443359375, -16.67041015625, -14.8974609375, -13.12451171875, -11.3515625, -9.57861328125, -7.8056640625, -6.03271484375, -4.259765625, -2.48681640625, -0.7138671875, 1.05908203125, 2.83203125, 4.60498046875, 6.3779296875, 8.15087890625, 9.923828125, 11.69677734375, 13.4697265625, 15.24267578125, 17.015625, 18.78857421875, 20.5615234375, 22.33447265625, 24.107421875, 25.88037109375, 27.6533203125, 29.42626953125, 31.19921875, 32.97216796875, 34.7451171875, 36.51806640625, 38.291015625, 40.06396484375, 41.8369140625, 43.60986328125, 45.3828125, 47.15576171875, 48.9287109375, 50.70166015625, 52.474609375, 54.24755859375, 56.0205078125, 57.79345703125, 59.56640625, 61.33935546875, 63.1123046875, 64.88525390625, 66.658203125, 68.43115234375, 70.2041015625, 71.97705078125, 73.75]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 38.0, 120.0, 311.0, 316.0, 167.0, 49.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-227.37490844726562, -223.09507751464844, -218.81524658203125, -214.53543090820312, -210.25559997558594, -205.97576904296875, -201.69595336914062, -197.41612243652344, -193.13629150390625, -188.85646057128906, -184.57662963867188, -180.29681396484375, -176.01698303222656, -171.73715209960938, -167.45733642578125, -163.17750549316406, -158.89767456054688, -154.6178436279297, -150.3380126953125, -146.05819702148438, -141.7783660888672, -137.49853515625, -133.21871948242188, -128.9388885498047, -124.6590576171875, -120.37922668457031, -116.09940338134766, -111.819580078125, -107.53974914550781, -103.25991821289062, -98.98009490966797, -94.70027160644531, -90.42044067382812, -86.14060974121094, -81.86078643798828, -77.58096313476562, -73.30113220214844, -69.02130126953125, -64.7414779663086, -60.46165084838867, -56.18182373046875, -51.90199661254883, -47.622169494628906, -43.342342376708984, -39.06251525878906, -34.78268814086914, -30.50286102294922, -26.223033905029297, -21.943206787109375, -17.663379669189453, -13.383552551269531, -9.10372543334961, -4.8238983154296875, -0.5440711975097656, 3.7357559204101562, 8.015583038330078, 12.29541015625, 16.575237274169922, 20.855064392089844, 25.134891510009766, 29.414718627929688, 33.69454574584961, 37.97437286376953, 42.25419998168945, 46.534027099609375]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 3.0, 7.0, 6.0, 6.0, 8.0, 10.0, 10.0, 14.0, 19.0, 12.0, 23.0, 30.0, 26.0, 27.0, 42.0, 25.0, 39.0, 41.0, 42.0, 43.0, 47.0, 49.0, 36.0, 46.0, 41.0, 37.0, 42.0, 26.0, 31.0, 28.0, 35.0, 33.0, 10.0, 18.0, 19.0, 15.0, 14.0, 7.0, 9.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.37052917480469, -35.0737419128418, -33.77695083618164, -32.48016357421875, -31.183374404907227, -29.886585235595703, -28.589797973632812, -27.29300880432129, -25.996219635009766, -24.699430465698242, -23.40264129638672, -22.105854034423828, -20.809064865112305, -19.51227569580078, -18.21548843383789, -16.918699264526367, -15.621910095214844, -14.32512092590332, -13.028332710266113, -11.731544494628906, -10.434755325317383, -9.13796615600586, -7.841177940368652, -6.544389724731445, -5.247600555419922, -3.9508118629455566, -2.6540231704711914, -1.3572344779968262, -0.06044578552246094, 1.2363429069519043, 2.5331315994262695, 3.8299198150634766, 5.126708984375, 6.423497676849365, 7.7202863693237305, 9.017074584960938, 10.313863754272461, 11.610652923583984, 12.907441139221191, 14.204229354858398, 15.501018524169922, 16.797807693481445, 18.09459686279297, 19.39138412475586, 20.688173294067383, 21.984962463378906, 23.281749725341797, 24.57853889465332, 25.875328063964844, 27.172117233276367, 28.46890640258789, 29.76569366455078, 31.062482833862305, 32.35927200317383, 33.65605926513672, 34.952850341796875, 36.249637603759766, 37.546424865722656, 38.84321594238281, 40.1400032043457, 41.436790466308594, 42.73358154296875, 44.03036880493164, 45.32715606689453, 46.62394714355469]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 6.0, 8.0, 11.0, 16.0, 18.0, 19.0, 15.0, 22.0, 23.0, 29.0, 34.0, 28.0, 28.0, 33.0, 54.0, 56.0, 47.0, 55.0, 50.0, 47.0, 44.0, 46.0, 51.0, 35.0, 32.0, 29.0, 27.0, 23.0, 25.0, 11.0, 13.0, 12.0, 14.0, 7.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.0997314453125, -3.968994140625, -3.8382568359375, -3.70751953125, -3.5767822265625, -3.446044921875, -3.3153076171875, -3.1845703125, -3.0538330078125, -2.923095703125, -2.7923583984375, -2.66162109375, -2.5308837890625, -2.400146484375, -2.2694091796875, -2.138671875, -2.0079345703125, -1.877197265625, -1.7464599609375, -1.61572265625, -1.4849853515625, -1.354248046875, -1.2235107421875, -1.0927734375, -0.9620361328125, -0.831298828125, -0.7005615234375, -0.56982421875, -0.4390869140625, -0.308349609375, -0.1776123046875, -0.046875, 0.0838623046875, 0.214599609375, 0.3453369140625, 0.47607421875, 0.6068115234375, 0.737548828125, 0.8682861328125, 0.9990234375, 1.1297607421875, 1.260498046875, 1.3912353515625, 1.52197265625, 1.6527099609375, 1.783447265625, 1.9141845703125, 2.044921875, 2.1756591796875, 2.306396484375, 2.4371337890625, 2.56787109375, 2.6986083984375, 2.829345703125, 2.9600830078125, 3.0908203125, 3.2215576171875, 3.352294921875, 3.4830322265625, 3.61376953125, 3.7445068359375, 3.875244140625, 4.0059814453125, 4.13671875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 10.0, 20.0, 16.0, 24.0, 42.0, 58.0, 80.0, 117.0, 157.0, 241.0, 380.0, 570.0, 886.0, 1497.0, 2306.0, 3804.0, 6510.0, 11031.0, 18570.0, 32690.0, 59946.0, 117934.0, 232594.0, 260700.0, 139127.0, 69405.0, 37405.0, 21189.0, 12323.0, 7416.0, 4449.0, 2522.0, 1635.0, 1036.0, 680.0, 384.0, 258.0, 170.0, 117.0, 70.0, 54.0, 36.0, 28.0, 16.0, 9.0, 9.0, 5.0, 7.0, 6.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.626953125, -0.6068038940429688, -0.5866546630859375, -0.5665054321289062, -0.546356201171875, -0.5262069702148438, -0.5060577392578125, -0.48590850830078125, -0.46575927734375, -0.44561004638671875, -0.4254608154296875, -0.40531158447265625, -0.385162353515625, -0.36501312255859375, -0.3448638916015625, -0.32471466064453125, -0.3045654296875, -0.28441619873046875, -0.2642669677734375, -0.24411773681640625, -0.223968505859375, -0.20381927490234375, -0.1836700439453125, -0.16352081298828125, -0.14337158203125, -0.12322235107421875, -0.1030731201171875, -0.08292388916015625, -0.062774658203125, -0.04262542724609375, -0.0224761962890625, -0.00232696533203125, 0.017822265625, 0.03797149658203125, 0.0581207275390625, 0.07826995849609375, 0.098419189453125, 0.11856842041015625, 0.1387176513671875, 0.15886688232421875, 0.17901611328125, 0.19916534423828125, 0.2193145751953125, 0.23946380615234375, 0.259613037109375, 0.27976226806640625, 0.2999114990234375, 0.32006072998046875, 0.3402099609375, 0.36035919189453125, 0.3805084228515625, 0.40065765380859375, 0.420806884765625, 0.44095611572265625, 0.4611053466796875, 0.48125457763671875, 0.50140380859375, 0.5215530395507812, 0.5417022705078125, 0.5618515014648438, 0.582000732421875, 0.6021499633789062, 0.6222991943359375, 0.6424484252929688, 0.66259765625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 1.0, 3.0, 6.0, 7.0, 11.0, 7.0, 10.0, 11.0, 16.0, 21.0, 17.0, 30.0, 31.0, 29.0, 36.0, 38.0, 30.0, 32.0, 44.0, 49.0, 32.0, 40.0, 1054.0, 45.0, 39.0, 37.0, 32.0, 36.0, 26.0, 34.0, 22.0, 24.0, 27.0, 23.0, 20.0, 13.0, 13.0, 20.0, 15.0, 8.0, 6.0, 5.0, 2.0, 6.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.205078125, -2.135955810546875, -2.06683349609375, -1.997711181640625, -1.9285888671875, -1.859466552734375, -1.79034423828125, -1.721221923828125, -1.652099609375, -1.582977294921875, -1.51385498046875, -1.444732666015625, -1.3756103515625, -1.306488037109375, -1.23736572265625, -1.168243408203125, -1.09912109375, -1.029998779296875, -0.96087646484375, -0.891754150390625, -0.8226318359375, -0.753509521484375, -0.68438720703125, -0.615264892578125, -0.546142578125, -0.477020263671875, -0.40789794921875, -0.338775634765625, -0.2696533203125, -0.200531005859375, -0.13140869140625, -0.062286376953125, 0.0068359375, 0.075958251953125, 0.14508056640625, 0.214202880859375, 0.2833251953125, 0.352447509765625, 0.42156982421875, 0.490692138671875, 0.559814453125, 0.628936767578125, 0.69805908203125, 0.767181396484375, 0.8363037109375, 0.905426025390625, 0.97454833984375, 1.043670654296875, 1.11279296875, 1.181915283203125, 1.25103759765625, 1.320159912109375, 1.3892822265625, 1.458404541015625, 1.52752685546875, 1.596649169921875, 1.665771484375, 1.734893798828125, 1.80401611328125, 1.873138427734375, 1.9422607421875, 2.011383056640625, 2.08050537109375, 2.149627685546875, 2.21875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 10.0, 7.0, 14.0, 20.0, 41.0, 42.0, 63.0, 117.0, 156.0, 262.0, 413.0, 754.0, 1091.0, 1867.0, 2972.0, 4949.0, 8411.0, 14433.0, 25282.0, 44767.0, 83069.0, 152201.0, 1284045.0, 206615.0, 118675.0, 63547.0, 34871.0, 19980.0, 11375.0, 6682.0, 3941.0, 2445.0, 1468.0, 913.0, 627.0, 349.0, 224.0, 138.0, 106.0, 62.0, 53.0, 19.0, 20.0, 16.0, 12.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.4443359375, -0.4307861328125, -0.417236328125, -0.4036865234375, -0.39013671875, -0.3765869140625, -0.363037109375, -0.3494873046875, -0.3359375, -0.3223876953125, -0.308837890625, -0.2952880859375, -0.28173828125, -0.2681884765625, -0.254638671875, -0.2410888671875, -0.2275390625, -0.2139892578125, -0.200439453125, -0.1868896484375, -0.17333984375, -0.1597900390625, -0.146240234375, -0.1326904296875, -0.119140625, -0.1055908203125, -0.092041015625, -0.0784912109375, -0.06494140625, -0.0513916015625, -0.037841796875, -0.0242919921875, -0.0107421875, 0.0028076171875, 0.016357421875, 0.0299072265625, 0.04345703125, 0.0570068359375, 0.070556640625, 0.0841064453125, 0.09765625, 0.1112060546875, 0.124755859375, 0.1383056640625, 0.15185546875, 0.1654052734375, 0.178955078125, 0.1925048828125, 0.2060546875, 0.2196044921875, 0.233154296875, 0.2467041015625, 0.26025390625, 0.2738037109375, 0.287353515625, 0.3009033203125, 0.314453125, 0.3280029296875, 0.341552734375, 0.3551025390625, 0.36865234375, 0.3822021484375, 0.395751953125, 0.4093017578125, 0.4228515625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 4.0, 5.0, 7.0, 13.0, 14.0, 7.0, 26.0, 29.0, 25.0, 43.0, 41.0, 51.0, 74.0, 64.0, 71.0, 62.0, 61.0, 69.0, 52.0, 51.0, 46.0, 34.0, 35.0, 19.0, 17.0, 11.0, 17.0, 8.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0017118453979492188, -0.0016632080078125, -0.0016145706176757812, -0.0015659332275390625, -0.0015172958374023438, -0.001468658447265625, -0.0014200210571289062, -0.0013713836669921875, -0.0013227462768554688, -0.00127410888671875, -0.0012254714965820312, -0.0011768341064453125, -0.0011281967163085938, -0.001079559326171875, -0.0010309219360351562, -0.0009822845458984375, -0.0009336471557617188, -0.000885009765625, -0.0008363723754882812, -0.0007877349853515625, -0.0007390975952148438, -0.000690460205078125, -0.0006418228149414062, -0.0005931854248046875, -0.0005445480346679688, -0.00049591064453125, -0.00044727325439453125, -0.0003986358642578125, -0.00034999847412109375, -0.000301361083984375, -0.00025272369384765625, -0.0002040863037109375, -0.00015544891357421875, -0.0001068115234375, -5.817413330078125e-05, -9.5367431640625e-06, 3.910064697265625e-05, 8.7738037109375e-05, 0.00013637542724609375, 0.0001850128173828125, 0.00023365020751953125, 0.00028228759765625, 0.00033092498779296875, 0.0003795623779296875, 0.00042819976806640625, 0.000476837158203125, 0.0005254745483398438, 0.0005741119384765625, 0.0006227493286132812, 0.00067138671875, 0.0007200241088867188, 0.0007686614990234375, 0.0008172988891601562, 0.000865936279296875, 0.0009145736694335938, 0.0009632110595703125, 0.0010118484497070312, 0.00106048583984375, 0.0011091232299804688, 0.0011577606201171875, 0.0012063980102539062, 0.001255035400390625, 0.0013036727905273438, 0.0013523101806640625, 0.0014009475708007812]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 4.0, 6.0, 11.0, 13.0, 12.0, 17.0, 27.0, 24.0, 37.0, 64.0, 67.0, 114.0, 161.0, 369.0, 909.0, 533945.0, 510902.0, 898.0, 395.0, 163.0, 97.0, 74.0, 43.0, 41.0, 36.0, 21.0, 8.0, 10.0, 12.0, 18.0, 9.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.04388427734375, -0.04246854782104492, -0.041052818298339844, -0.039637088775634766, -0.03822135925292969, -0.03680562973022461, -0.03538990020751953, -0.03397417068481445, -0.032558441162109375, -0.031142711639404297, -0.02972698211669922, -0.02831125259399414, -0.026895523071289062, -0.025479793548583984, -0.024064064025878906, -0.022648334503173828, -0.02123260498046875, -0.019816875457763672, -0.018401145935058594, -0.016985416412353516, -0.015569686889648438, -0.01415395736694336, -0.012738227844238281, -0.011322498321533203, -0.009906768798828125, -0.008491039276123047, -0.007075309753417969, -0.005659580230712891, -0.0042438507080078125, -0.0028281211853027344, -0.0014123916625976562, 3.337860107421875e-06, 0.0014190673828125, 0.002834796905517578, 0.004250526428222656, 0.005666255950927734, 0.0070819854736328125, 0.00849771499633789, 0.009913444519042969, 0.011329174041748047, 0.012744903564453125, 0.014160633087158203, 0.015576362609863281, 0.01699209213256836, 0.018407821655273438, 0.019823551177978516, 0.021239280700683594, 0.022655010223388672, 0.02407073974609375, 0.025486469268798828, 0.026902198791503906, 0.028317928314208984, 0.029733657836914062, 0.03114938735961914, 0.03256511688232422, 0.0339808464050293, 0.035396575927734375, 0.03681230545043945, 0.03822803497314453, 0.03964376449584961, 0.04105949401855469, 0.042475223541259766, 0.043890953063964844, 0.04530668258666992, 0.046722412109375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1018.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007014077622443438, -0.00571267819032073, -0.0044112782925367355, -0.003109878860414028, -0.0018084794282913208, -0.0005070799961686134, 0.0007943199016153812, 0.0020957193337380886, 0.003397118765860796, 0.004698518197983503, 0.005999918095767498, 0.007301317527890205, 0.008602716960012913, 0.00990411639213562, 0.011205516755580902, 0.012506915256381035, 0.013808315619826317, 0.015109715051949024, 0.01641111448407173, 0.017712514847517014, 0.019013913348317146, 0.02031531371176243, 0.02161671221256256, 0.022918112576007843, 0.024219511076807976, 0.025520911440253258, 0.02682230994105339, 0.028123710304498672, 0.029425108805298805, 0.030726509168744087, 0.03202790766954422, 0.0333293080329895, 0.034630704671144485, 0.03593210503458977, 0.03723350539803505, 0.03853490203619003, 0.039836302399635315, 0.0411377027630806, 0.04243910312652588, 0.04374050348997116, 0.045041900128126144, 0.046343300491571426, 0.04764470085501671, 0.04894609749317169, 0.050247497856616974, 0.051548898220062256, 0.05285029858350754, 0.05415169894695282, 0.0554530993103981, 0.056754499673843384, 0.058055900037288666, 0.05935729667544365, 0.06065869703888893, 0.06196009740233421, 0.0632614940404892, 0.06456289440393448, 0.06586429476737976, 0.06716569513082504, 0.06846709549427032, 0.0697684958577156, 0.07106989622116089, 0.07237128913402557, 0.07367268949747086, 0.07497408986091614, 0.07627549022436142]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 9.0, 7.0, 9.0, 15.0, 15.0, 22.0, 24.0, 19.0, 29.0, 45.0, 45.0, 47.0, 67.0, 62.0, 70.0, 53.0, 61.0, 47.0, 60.0, 52.0, 42.0, 45.0, 29.0, 27.0, 34.0, 19.0, 16.0, 13.0, 13.0, 12.0, 5.0, 2.0, 3.0], "bins": [-0.0016615986824035645, -0.0016258619725704193, -0.0015901252627372742, -0.001554388552904129, -0.0015186518430709839, -0.0014829151332378387, -0.0014471784234046936, -0.0014114417135715485, -0.0013757050037384033, -0.0013399682939052582, -0.001304231584072113, -0.001268494874238968, -0.0012327581644058228, -0.0011970214545726776, -0.0011612847447395325, -0.0011255480349063873, -0.0010898113250732422, -0.001054074615240097, -0.001018337905406952, -0.0009826011955738068, -0.0009468644857406616, -0.0009111277759075165, -0.0008753910660743713, -0.0008396543562412262, -0.0008039176464080811, -0.0007681809365749359, -0.0007324442267417908, -0.0006967075169086456, -0.0006609708070755005, -0.0006252340972423553, -0.0005894973874092102, -0.0005537606775760651, -0.0005180239677429199, -0.0004822872579097748, -0.00044655054807662964, -0.0004108138382434845, -0.00037507712841033936, -0.0003393404185771942, -0.00030360370874404907, -0.00026786699891090393, -0.0002321302890777588, -0.00019639357924461365, -0.0001606568694114685, -0.00012492015957832336, -8.918344974517822e-05, -5.344673991203308e-05, -1.771003007888794e-05, 1.8026679754257202e-05, 5.3763389587402344e-05, 8.950009942054749e-05, 0.00012523680925369263, 0.00016097351908683777, 0.0001967102289199829, 0.00023244693875312805, 0.0002681836485862732, 0.00030392035841941833, 0.0003396570682525635, 0.0003753937780857086, 0.00041113048791885376, 0.0004468671977519989, 0.00048260390758514404, 0.0005183406174182892, 0.0005540773272514343, 0.0005898140370845795, 0.0006255507469177246]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 6.0, 8.0, 11.0, 16.0, 18.0, 19.0, 15.0, 22.0, 23.0, 29.0, 34.0, 28.0, 28.0, 33.0, 54.0, 56.0, 47.0, 55.0, 50.0, 47.0, 44.0, 46.0, 51.0, 35.0, 32.0, 29.0, 27.0, 23.0, 25.0, 11.0, 13.0, 12.0, 14.0, 7.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.0997314453125, -3.968994140625, -3.8382568359375, -3.70751953125, -3.5767822265625, -3.446044921875, -3.3153076171875, -3.1845703125, -3.0538330078125, -2.923095703125, -2.7923583984375, -2.66162109375, -2.5308837890625, -2.400146484375, -2.2694091796875, -2.138671875, -2.0079345703125, -1.877197265625, -1.7464599609375, -1.61572265625, -1.4849853515625, -1.354248046875, -1.2235107421875, -1.0927734375, -0.9620361328125, -0.831298828125, -0.7005615234375, -0.56982421875, -0.4390869140625, -0.308349609375, -0.1776123046875, -0.046875, 0.0838623046875, 0.214599609375, 0.3453369140625, 0.47607421875, 0.6068115234375, 0.737548828125, 0.8682861328125, 0.9990234375, 1.1297607421875, 1.260498046875, 1.3912353515625, 1.52197265625, 1.6527099609375, 1.783447265625, 1.9141845703125, 2.044921875, 2.1756591796875, 2.306396484375, 2.4371337890625, 2.56787109375, 2.6986083984375, 2.829345703125, 2.9600830078125, 3.0908203125, 3.2215576171875, 3.352294921875, 3.4830322265625, 3.61376953125, 3.7445068359375, 3.875244140625, 4.0059814453125, 4.13671875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 14.0, 10.0, 13.0, 19.0, 24.0, 35.0, 57.0, 65.0, 110.0, 160.0, 246.0, 429.0, 722.0, 1277.0, 2468.0, 5173.0, 12257.0, 35204.0, 122409.0, 521154.0, 251345.0, 60355.0, 19652.0, 7634.0, 3519.0, 1754.0, 950.0, 529.0, 338.0, 213.0, 109.0, 93.0, 53.0, 39.0, 33.0, 27.0, 17.0, 14.0, 5.0, 3.0, 3.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.59375, -3.487213134765625, -3.38067626953125, -3.274139404296875, -3.1676025390625, -3.061065673828125, -2.95452880859375, -2.847991943359375, -2.741455078125, -2.634918212890625, -2.52838134765625, -2.421844482421875, -2.3153076171875, -2.208770751953125, -2.10223388671875, -1.995697021484375, -1.88916015625, -1.782623291015625, -1.67608642578125, -1.569549560546875, -1.4630126953125, -1.356475830078125, -1.24993896484375, -1.143402099609375, -1.036865234375, -0.930328369140625, -0.82379150390625, -0.717254638671875, -0.6107177734375, -0.504180908203125, -0.39764404296875, -0.291107177734375, -0.1845703125, -0.078033447265625, 0.02850341796875, 0.135040283203125, 0.2415771484375, 0.348114013671875, 0.45465087890625, 0.561187744140625, 0.667724609375, 0.774261474609375, 0.88079833984375, 0.987335205078125, 1.0938720703125, 1.200408935546875, 1.30694580078125, 1.413482666015625, 1.52001953125, 1.626556396484375, 1.73309326171875, 1.839630126953125, 1.9461669921875, 2.052703857421875, 2.15924072265625, 2.265777587890625, 2.372314453125, 2.478851318359375, 2.58538818359375, 2.691925048828125, 2.7984619140625, 2.904998779296875, 3.01153564453125, 3.118072509765625, 3.224609375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 8.0, 6.0, 11.0, 7.0, 17.0, 17.0, 24.0, 27.0, 35.0, 43.0, 39.0, 41.0, 44.0, 73.0, 95.0, 1734.0, 322.0, 84.0, 66.0, 43.0, 51.0, 40.0, 44.0, 30.0, 30.0, 17.0, 23.0, 15.0, 8.0, 13.0, 8.0, 3.0, 10.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-18.53125, -18.028076171875, -17.52490234375, -17.021728515625, -16.5185546875, -16.015380859375, -15.51220703125, -15.009033203125, -14.505859375, -14.002685546875, -13.49951171875, -12.996337890625, -12.4931640625, -11.989990234375, -11.48681640625, -10.983642578125, -10.48046875, -9.977294921875, -9.47412109375, -8.970947265625, -8.4677734375, -7.964599609375, -7.46142578125, -6.958251953125, -6.455078125, -5.951904296875, -5.44873046875, -4.945556640625, -4.4423828125, -3.939208984375, -3.43603515625, -2.932861328125, -2.4296875, -1.926513671875, -1.42333984375, -0.920166015625, -0.4169921875, 0.086181640625, 0.58935546875, 1.092529296875, 1.595703125, 2.098876953125, 2.60205078125, 3.105224609375, 3.6083984375, 4.111572265625, 4.61474609375, 5.117919921875, 5.62109375, 6.124267578125, 6.62744140625, 7.130615234375, 7.6337890625, 8.136962890625, 8.64013671875, 9.143310546875, 9.646484375, 10.149658203125, 10.65283203125, 11.156005859375, 11.6591796875, 12.162353515625, 12.66552734375, 13.168701171875, 13.671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 3.0, 6.0, 7.0, 3.0, 13.0, 13.0, 19.0, 24.0, 15.0, 33.0, 45.0, 55.0, 81.0, 108.0, 180.0, 342.0, 883.0, 8215.0, 3018011.0, 114333.0, 2089.0, 519.0, 228.0, 124.0, 95.0, 66.0, 48.0, 23.0, 21.0, 28.0, 16.0, 10.0, 12.0, 6.0, 7.0, 6.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.3125, -20.544921875, -19.77734375, -19.009765625, -18.2421875, -17.474609375, -16.70703125, -15.939453125, -15.171875, -14.404296875, -13.63671875, -12.869140625, -12.1015625, -11.333984375, -10.56640625, -9.798828125, -9.03125, -8.263671875, -7.49609375, -6.728515625, -5.9609375, -5.193359375, -4.42578125, -3.658203125, -2.890625, -2.123046875, -1.35546875, -0.587890625, 0.1796875, 0.947265625, 1.71484375, 2.482421875, 3.25, 4.017578125, 4.78515625, 5.552734375, 6.3203125, 7.087890625, 7.85546875, 8.623046875, 9.390625, 10.158203125, 10.92578125, 11.693359375, 12.4609375, 13.228515625, 13.99609375, 14.763671875, 15.53125, 16.298828125, 17.06640625, 17.833984375, 18.6015625, 19.369140625, 20.13671875, 20.904296875, 21.671875, 22.439453125, 23.20703125, 23.974609375, 24.7421875, 25.509765625, 26.27734375, 27.044921875, 27.8125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 47.0, 233.0, 381.0, 273.0, 60.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.573726654052734, -48.43610382080078, -47.29848098754883, -46.16085433959961, -45.023231506347656, -43.8856086730957, -42.74798583984375, -41.61035919189453, -40.47273635864258, -39.335113525390625, -38.19749069213867, -37.05986404418945, -35.9222412109375, -34.78461837768555, -33.646995544433594, -32.509368896484375, -31.371747970581055, -30.2341251373291, -29.096500396728516, -27.958877563476562, -26.821252822875977, -25.683629989624023, -24.546005249023438, -23.408382415771484, -22.27075958251953, -21.133136749267578, -19.995512008666992, -18.85788917541504, -17.720264434814453, -16.5826416015625, -15.44501781463623, -14.307394027709961, -13.169767379760742, -12.032143592834473, -10.894519805908203, -9.75689697265625, -8.619272232055664, -7.481648921966553, -6.344025611877441, -5.206401824951172, -4.068778038024902, -2.931154251098633, -1.7935307025909424, -0.655907154083252, 0.4817166328430176, 1.619340419769287, 2.7569637298583984, 3.894587516784668, 5.0322113037109375, 6.169835090637207, 7.307458877563477, 8.44508171081543, 9.582706451416016, 10.720329284667969, 11.857953071594238, 12.995576858520508, 14.133200645446777, 15.270824432373047, 16.408447265625, 17.546072006225586, 18.68369483947754, 19.821319580078125, 20.958942413330078, 22.09656524658203, 23.234189987182617]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 9.0, 6.0, 15.0, 11.0, 15.0, 14.0, 24.0, 27.0, 34.0, 29.0, 37.0, 31.0, 32.0, 34.0, 33.0, 44.0, 41.0, 27.0, 33.0, 46.0, 26.0, 43.0, 36.0, 31.0, 44.0, 38.0, 22.0, 22.0, 18.0, 19.0, 12.0, 21.0, 21.0, 19.0, 13.0, 8.0, 6.0, 13.0, 9.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.89753723144531, -34.700870513916016, -33.50420379638672, -32.30754089355469, -31.11087417602539, -29.914207458496094, -28.717540740966797, -27.520875930786133, -26.32421112060547, -25.127544403076172, -23.930879592895508, -22.73421287536621, -21.537548065185547, -20.34088134765625, -19.144214630126953, -17.94754981994629, -16.750883102416992, -15.554217338562012, -14.357551574707031, -13.160884857177734, -11.96422004699707, -10.767553329467773, -9.570887565612793, -8.374221801757812, -7.177556037902832, -5.980890274047852, -4.784224510192871, -3.5875582695007324, -2.390892505645752, -1.1942267417907715, 0.0024394989013671875, 1.1991052627563477, 2.395771026611328, 3.5924367904663086, 4.789102554321289, 5.985768795013428, 7.182434558868408, 8.379100799560547, 9.575766563415527, 10.772432327270508, 11.969098091125488, 13.165763854980469, 14.36242961883545, 15.55909538269043, 16.755762100219727, 17.95242691040039, 19.149093627929688, 20.345760345458984, 21.54242515563965, 22.739091873168945, 23.93575668334961, 25.132423400878906, 26.32908821105957, 27.525754928588867, 28.72241973876953, 29.919086456298828, 31.115753173828125, 32.31241989135742, 33.50908660888672, 34.70574951171875, 35.90241622924805, 37.099082946777344, 38.29574966430664, 39.49241638183594, 40.68907928466797]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 5.0, 7.0, 7.0, 8.0, 11.0, 12.0, 19.0, 14.0, 19.0, 22.0, 25.0, 23.0, 30.0, 31.0, 33.0, 37.0, 49.0, 52.0, 40.0, 66.0, 51.0, 42.0, 37.0, 50.0, 52.0, 45.0, 28.0, 27.0, 33.0, 30.0, 21.0, 10.0, 15.0, 10.0, 13.0, 8.0, 8.0, 5.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.38671875, -4.25201416015625, -4.1173095703125, -3.98260498046875, -3.847900390625, -3.71319580078125, -3.5784912109375, -3.44378662109375, -3.30908203125, -3.17437744140625, -3.0396728515625, -2.90496826171875, -2.770263671875, -2.63555908203125, -2.5008544921875, -2.36614990234375, -2.2314453125, -2.09674072265625, -1.9620361328125, -1.82733154296875, -1.692626953125, -1.55792236328125, -1.4232177734375, -1.28851318359375, -1.15380859375, -1.01910400390625, -0.8843994140625, -0.74969482421875, -0.614990234375, -0.48028564453125, -0.3455810546875, -0.21087646484375, -0.076171875, 0.05853271484375, 0.1932373046875, 0.32794189453125, 0.462646484375, 0.59735107421875, 0.7320556640625, 0.86676025390625, 1.00146484375, 1.13616943359375, 1.2708740234375, 1.40557861328125, 1.540283203125, 1.67498779296875, 1.8096923828125, 1.94439697265625, 2.0791015625, 2.21380615234375, 2.3485107421875, 2.48321533203125, 2.617919921875, 2.75262451171875, 2.8873291015625, 3.02203369140625, 3.15673828125, 3.29144287109375, 3.4261474609375, 3.56085205078125, 3.695556640625, 3.83026123046875, 3.9649658203125, 4.09967041015625, 4.234375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 8.0, 7.0, 12.0, 11.0, 13.0, 11.0, 19.0, 32.0, 27.0, 70.0, 87.0, 168.0, 344.0, 946.0, 2709.0, 9599.0, 39473.0, 248779.0, 1945804.0, 1687099.0, 211583.0, 34633.0, 8597.0, 2537.0, 862.0, 372.0, 170.0, 89.0, 62.0, 44.0, 25.0, 11.0, 16.0, 15.0, 5.0, 10.0, 9.0, 8.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-9.9765625, -9.691162109375, -9.40576171875, -9.120361328125, -8.8349609375, -8.549560546875, -8.26416015625, -7.978759765625, -7.693359375, -7.407958984375, -7.12255859375, -6.837158203125, -6.5517578125, -6.266357421875, -5.98095703125, -5.695556640625, -5.41015625, -5.124755859375, -4.83935546875, -4.553955078125, -4.2685546875, -3.983154296875, -3.69775390625, -3.412353515625, -3.126953125, -2.841552734375, -2.55615234375, -2.270751953125, -1.9853515625, -1.699951171875, -1.41455078125, -1.129150390625, -0.84375, -0.558349609375, -0.27294921875, 0.012451171875, 0.2978515625, 0.583251953125, 0.86865234375, 1.154052734375, 1.439453125, 1.724853515625, 2.01025390625, 2.295654296875, 2.5810546875, 2.866455078125, 3.15185546875, 3.437255859375, 3.72265625, 4.008056640625, 4.29345703125, 4.578857421875, 4.8642578125, 5.149658203125, 5.43505859375, 5.720458984375, 6.005859375, 6.291259765625, 6.57666015625, 6.862060546875, 7.1474609375, 7.432861328125, 7.71826171875, 8.003662109375, 8.2890625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 8.0, 5.0, 6.0, 23.0, 30.0, 32.0, 81.0, 96.0, 130.0, 257.0, 360.0, 543.0, 687.0, 599.0, 424.0, 291.0, 194.0, 100.0, 72.0, 50.0, 34.0, 19.0, 15.0, 3.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.796875, -18.2841796875, -17.771484375, -17.2587890625, -16.74609375, -16.2333984375, -15.720703125, -15.2080078125, -14.6953125, -14.1826171875, -13.669921875, -13.1572265625, -12.64453125, -12.1318359375, -11.619140625, -11.1064453125, -10.59375, -10.0810546875, -9.568359375, -9.0556640625, -8.54296875, -8.0302734375, -7.517578125, -7.0048828125, -6.4921875, -5.9794921875, -5.466796875, -4.9541015625, -4.44140625, -3.9287109375, -3.416015625, -2.9033203125, -2.390625, -1.8779296875, -1.365234375, -0.8525390625, -0.33984375, 0.1728515625, 0.685546875, 1.1982421875, 1.7109375, 2.2236328125, 2.736328125, 3.2490234375, 3.76171875, 4.2744140625, 4.787109375, 5.2998046875, 5.8125, 6.3251953125, 6.837890625, 7.3505859375, 7.86328125, 8.3759765625, 8.888671875, 9.4013671875, 9.9140625, 10.4267578125, 10.939453125, 11.4521484375, 11.96484375, 12.4775390625, 12.990234375, 13.5029296875, 14.015625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 12.0, 12.0, 18.0, 28.0, 42.0, 65.0, 99.0, 177.0, 398.0, 1761.0, 64863.0, 4070773.0, 53575.0, 1639.0, 336.0, 189.0, 103.0, 57.0, 41.0, 29.0, 24.0, 15.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.375, -51.6240234375, -49.873046875, -48.1220703125, -46.37109375, -44.6201171875, -42.869140625, -41.1181640625, -39.3671875, -37.6162109375, -35.865234375, -34.1142578125, -32.36328125, -30.6123046875, -28.861328125, -27.1103515625, -25.359375, -23.6083984375, -21.857421875, -20.1064453125, -18.35546875, -16.6044921875, -14.853515625, -13.1025390625, -11.3515625, -9.6005859375, -7.849609375, -6.0986328125, -4.34765625, -2.5966796875, -0.845703125, 0.9052734375, 2.65625, 4.4072265625, 6.158203125, 7.9091796875, 9.66015625, 11.4111328125, 13.162109375, 14.9130859375, 16.6640625, 18.4150390625, 20.166015625, 21.9169921875, 23.66796875, 25.4189453125, 27.169921875, 28.9208984375, 30.671875, 32.4228515625, 34.173828125, 35.9248046875, 37.67578125, 39.4267578125, 41.177734375, 42.9287109375, 44.6796875, 46.4306640625, 48.181640625, 49.9326171875, 51.68359375, 53.4345703125, 55.185546875, 56.9365234375, 58.6875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 9.0, 27.0, 66.0, 154.0, 232.0, 251.0, 140.0, 102.0, 24.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.12625122070312, -67.08890533447266, -64.05156707763672, -61.01422119140625, -57.97688293457031, -54.939537048339844, -51.90219497680664, -48.86485290527344, -45.827510833740234, -42.79016876220703, -39.75282669067383, -36.715484619140625, -33.678138732910156, -30.640798568725586, -27.60345458984375, -24.566112518310547, -21.528770446777344, -18.49142837524414, -15.454085350036621, -12.416742324829102, -9.379400253295898, -6.342058181762695, -3.3047142028808594, -0.26737213134765625, 2.769969940185547, 5.807312488555908, 8.84465503692627, 11.881998062133789, 14.919340133666992, 17.956682205200195, 20.99402618408203, 24.031368255615234, 27.068702697753906, 30.10604476928711, 33.14338684082031, 36.18073272705078, 39.21807098388672, 42.25541687011719, 45.29275894165039, 48.330101013183594, 51.3674430847168, 54.40478515625, 57.4421272277832, 60.479469299316406, 63.516815185546875, 66.55415344238281, 69.59149932861328, 72.62884521484375, 75.66618347167969, 78.70352935791016, 81.7408676147461, 84.77821350097656, 87.8155517578125, 90.85289764404297, 93.89024353027344, 96.92758178710938, 99.96492004394531, 103.00226593017578, 106.03960418701172, 109.07695007324219, 112.11428833007812, 115.1516342163086, 118.18898010253906, 121.226318359375, 124.26366424560547]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 6.0, 5.0, 5.0, 7.0, 9.0, 5.0, 14.0, 13.0, 18.0, 25.0, 33.0, 24.0, 24.0, 41.0, 28.0, 39.0, 32.0, 40.0, 42.0, 38.0, 34.0, 37.0, 43.0, 42.0, 35.0, 32.0, 32.0, 35.0, 34.0, 26.0, 28.0, 27.0, 24.0, 17.0, 13.0, 9.0, 15.0, 18.0, 16.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-40.74736022949219, -39.589813232421875, -38.4322624206543, -37.27471160888672, -36.117164611816406, -34.959617614746094, -33.802066802978516, -32.64451599121094, -31.486968994140625, -30.32942008972168, -29.171871185302734, -28.01432228088379, -26.856773376464844, -25.6992244720459, -24.541675567626953, -23.384126663208008, -22.226577758789062, -21.069028854370117, -19.911479949951172, -18.753931045532227, -17.59638214111328, -16.438833236694336, -15.28128433227539, -14.123735427856445, -12.9661865234375, -11.808637619018555, -10.65108871459961, -9.493539810180664, -8.335990905761719, -7.178442001342773, -6.020893096923828, -4.863344192504883, -3.705791473388672, -2.5482425689697266, -1.3906936645507812, -0.23314476013183594, 0.9244041442871094, 2.0819530487060547, 3.239501953125, 4.397050857543945, 5.554599761962891, 6.712148666381836, 7.869697570800781, 9.027246475219727, 10.184795379638672, 11.342344284057617, 12.499893188476562, 13.657442092895508, 14.814990997314453, 15.972539901733398, 17.130088806152344, 18.28763771057129, 19.445186614990234, 20.60273551940918, 21.760284423828125, 22.91783332824707, 24.075382232666016, 25.23293113708496, 26.390480041503906, 27.54802894592285, 28.705577850341797, 29.863126754760742, 31.020675659179688, 32.17822265625, 33.33577346801758]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 2.0, 6.0, 5.0, 5.0, 6.0, 8.0, 13.0, 14.0, 18.0, 19.0, 13.0, 17.0, 27.0, 23.0, 40.0, 31.0, 29.0, 32.0, 52.0, 44.0, 49.0, 49.0, 38.0, 49.0, 50.0, 41.0, 38.0, 40.0, 31.0, 34.0, 29.0, 33.0, 17.0, 22.0, 6.0, 18.0, 8.0, 14.0, 13.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.0625, -3.93463134765625, -3.8067626953125, -3.67889404296875, -3.551025390625, -3.42315673828125, -3.2952880859375, -3.16741943359375, -3.03955078125, -2.91168212890625, -2.7838134765625, -2.65594482421875, -2.528076171875, -2.40020751953125, -2.2723388671875, -2.14447021484375, -2.0166015625, -1.88873291015625, -1.7608642578125, -1.63299560546875, -1.505126953125, -1.37725830078125, -1.2493896484375, -1.12152099609375, -0.99365234375, -0.86578369140625, -0.7379150390625, -0.61004638671875, -0.482177734375, -0.35430908203125, -0.2264404296875, -0.09857177734375, 0.029296875, 0.15716552734375, 0.2850341796875, 0.41290283203125, 0.540771484375, 0.66864013671875, 0.7965087890625, 0.92437744140625, 1.05224609375, 1.18011474609375, 1.3079833984375, 1.43585205078125, 1.563720703125, 1.69158935546875, 1.8194580078125, 1.94732666015625, 2.0751953125, 2.20306396484375, 2.3309326171875, 2.45880126953125, 2.586669921875, 2.71453857421875, 2.8424072265625, 2.97027587890625, 3.09814453125, 3.22601318359375, 3.3538818359375, 3.48175048828125, 3.609619140625, 3.73748779296875, 3.8653564453125, 3.99322509765625, 4.12109375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 9.0, 11.0, 24.0, 19.0, 43.0, 54.0, 95.0, 123.0, 180.0, 267.0, 423.0, 668.0, 1121.0, 1766.0, 3096.0, 5136.0, 8884.0, 15481.0, 27102.0, 50508.0, 98507.0, 201509.0, 283850.0, 168604.0, 82436.0, 43016.0, 23261.0, 13201.0, 7738.0, 4427.0, 2608.0, 1640.0, 1004.0, 643.0, 386.0, 234.0, 170.0, 95.0, 69.0, 43.0, 32.0, 26.0, 9.0, 9.0, 9.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.68115234375, -0.6594390869140625, -0.637725830078125, -0.6160125732421875, -0.59429931640625, -0.5725860595703125, -0.550872802734375, -0.5291595458984375, -0.5074462890625, -0.4857330322265625, -0.464019775390625, -0.4423065185546875, -0.42059326171875, -0.3988800048828125, -0.377166748046875, -0.3554534912109375, -0.333740234375, -0.3120269775390625, -0.290313720703125, -0.2686004638671875, -0.24688720703125, -0.2251739501953125, -0.203460693359375, -0.1817474365234375, -0.1600341796875, -0.1383209228515625, -0.116607666015625, -0.0948944091796875, -0.07318115234375, -0.0514678955078125, -0.029754638671875, -0.0080413818359375, 0.013671875, 0.0353851318359375, 0.057098388671875, 0.0788116455078125, 0.10052490234375, 0.1222381591796875, 0.143951416015625, 0.1656646728515625, 0.1873779296875, 0.2090911865234375, 0.230804443359375, 0.2525177001953125, 0.27423095703125, 0.2959442138671875, 0.317657470703125, 0.3393707275390625, 0.361083984375, 0.3827972412109375, 0.404510498046875, 0.4262237548828125, 0.44793701171875, 0.4696502685546875, 0.491363525390625, 0.5130767822265625, 0.5347900390625, 0.5565032958984375, 0.578216552734375, 0.5999298095703125, 0.62164306640625, 0.6433563232421875, 0.665069580078125, 0.6867828369140625, 0.70849609375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 8.0, 5.0, 6.0, 8.0, 7.0, 20.0, 15.0, 15.0, 16.0, 20.0, 26.0, 28.0, 28.0, 38.0, 25.0, 30.0, 37.0, 50.0, 42.0, 40.0, 34.0, 1046.0, 31.0, 33.0, 35.0, 37.0, 43.0, 31.0, 45.0, 33.0, 26.0, 25.0, 15.0, 17.0, 17.0, 17.0, 15.0, 12.0, 10.0, 10.0, 6.0, 8.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0], "bins": [-2.57421875, -2.503326416015625, -2.43243408203125, -2.361541748046875, -2.2906494140625, -2.219757080078125, -2.14886474609375, -2.077972412109375, -2.007080078125, -1.936187744140625, -1.86529541015625, -1.794403076171875, -1.7235107421875, -1.652618408203125, -1.58172607421875, -1.510833740234375, -1.43994140625, -1.369049072265625, -1.29815673828125, -1.227264404296875, -1.1563720703125, -1.085479736328125, -1.01458740234375, -0.943695068359375, -0.872802734375, -0.801910400390625, -0.73101806640625, -0.660125732421875, -0.5892333984375, -0.518341064453125, -0.44744873046875, -0.376556396484375, -0.3056640625, -0.234771728515625, -0.16387939453125, -0.092987060546875, -0.0220947265625, 0.048797607421875, 0.11968994140625, 0.190582275390625, 0.261474609375, 0.332366943359375, 0.40325927734375, 0.474151611328125, 0.5450439453125, 0.615936279296875, 0.68682861328125, 0.757720947265625, 0.82861328125, 0.899505615234375, 0.97039794921875, 1.041290283203125, 1.1121826171875, 1.183074951171875, 1.25396728515625, 1.324859619140625, 1.395751953125, 1.466644287109375, 1.53753662109375, 1.608428955078125, 1.6793212890625, 1.750213623046875, 1.82110595703125, 1.891998291015625, 1.962890625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 5.0, 5.0, 8.0, 12.0, 21.0, 35.0, 55.0, 77.0, 107.0, 175.0, 326.0, 504.0, 779.0, 1194.0, 2080.0, 3282.0, 5545.0, 9419.0, 16180.0, 28295.0, 50109.0, 91348.0, 169611.0, 1292761.0, 188776.0, 103721.0, 56629.0, 31849.0, 17954.0, 10456.0, 6228.0, 3785.0, 2150.0, 1350.0, 824.0, 509.0, 350.0, 216.0, 138.0, 81.0, 69.0, 41.0, 28.0, 14.0, 12.0, 7.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.471923828125, -0.45787811279296875, -0.4438323974609375, -0.42978668212890625, -0.415740966796875, -0.40169525146484375, -0.3876495361328125, -0.37360382080078125, -0.35955810546875, -0.34551239013671875, -0.3314666748046875, -0.31742095947265625, -0.303375244140625, -0.28932952880859375, -0.2752838134765625, -0.26123809814453125, -0.2471923828125, -0.23314666748046875, -0.2191009521484375, -0.20505523681640625, -0.191009521484375, -0.17696380615234375, -0.1629180908203125, -0.14887237548828125, -0.13482666015625, -0.12078094482421875, -0.1067352294921875, -0.09268951416015625, -0.078643798828125, -0.06459808349609375, -0.0505523681640625, -0.03650665283203125, -0.0224609375, -0.00841522216796875, 0.0056304931640625, 0.01967620849609375, 0.033721923828125, 0.04776763916015625, 0.0618133544921875, 0.07585906982421875, 0.08990478515625, 0.10395050048828125, 0.1179962158203125, 0.13204193115234375, 0.146087646484375, 0.16013336181640625, 0.1741790771484375, 0.18822479248046875, 0.2022705078125, 0.21631622314453125, 0.2303619384765625, 0.24440765380859375, 0.258453369140625, 0.27249908447265625, 0.2865447998046875, 0.30059051513671875, 0.31463623046875, 0.32868194580078125, 0.3427276611328125, 0.35677337646484375, 0.370819091796875, 0.38486480712890625, 0.3989105224609375, 0.41295623779296875, 0.427001953125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 7.0, 4.0, 6.0, 9.0, 14.0, 9.0, 12.0, 18.0, 12.0, 25.0, 31.0, 37.0, 45.0, 55.0, 70.0, 69.0, 78.0, 79.0, 77.0, 64.0, 57.0, 39.0, 38.0, 35.0, 20.0, 18.0, 17.0, 10.0, 4.0, 5.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021152496337890625, -0.002048969268798828, -0.0019826889038085938, -0.0019164085388183594, -0.001850128173828125, -0.0017838478088378906, -0.0017175674438476562, -0.0016512870788574219, -0.0015850067138671875, -0.0015187263488769531, -0.0014524459838867188, -0.0013861656188964844, -0.00131988525390625, -0.0012536048889160156, -0.0011873245239257812, -0.0011210441589355469, -0.0010547637939453125, -0.0009884834289550781, -0.0009222030639648438, -0.0008559226989746094, -0.000789642333984375, -0.0007233619689941406, -0.0006570816040039062, -0.0005908012390136719, -0.0005245208740234375, -0.0004582405090332031, -0.00039196014404296875, -0.0003256797790527344, -0.0002593994140625, -0.00019311904907226562, -0.00012683868408203125, -6.0558319091796875e-05, 5.7220458984375e-06, 7.200241088867188e-05, 0.00013828277587890625, 0.00020456314086914062, 0.000270843505859375, 0.0003371238708496094, 0.00040340423583984375, 0.0004696846008300781, 0.0005359649658203125, 0.0006022453308105469, 0.0006685256958007812, 0.0007348060607910156, 0.00080108642578125, 0.0008673667907714844, 0.0009336471557617188, 0.0009999275207519531, 0.0010662078857421875, 0.0011324882507324219, 0.0011987686157226562, 0.0012650489807128906, 0.001331329345703125, 0.0013976097106933594, 0.0014638900756835938, 0.0015301704406738281, 0.0015964508056640625, 0.0016627311706542969, 0.0017290115356445312, 0.0017952919006347656, 0.001861572265625, 0.0019278526306152344, 0.0019941329956054688, 0.002060413360595703, 0.0021266937255859375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 7.0, 10.0, 10.0, 13.0, 17.0, 16.0, 27.0, 49.0, 84.0, 125.0, 227.0, 542.0, 3579.0, 1039957.0, 2735.0, 486.0, 257.0, 133.0, 73.0, 41.0, 28.0, 27.0, 16.0, 8.0, 13.0, 11.0, 14.0, 3.0, 12.0, 5.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059326171875, -0.05749940872192383, -0.055672645568847656, -0.053845882415771484, -0.05201911926269531, -0.05019235610961914, -0.04836559295654297, -0.0465388298034668, -0.044712066650390625, -0.04288530349731445, -0.04105854034423828, -0.03923177719116211, -0.03740501403808594, -0.035578250885009766, -0.033751487731933594, -0.03192472457885742, -0.03009796142578125, -0.028271198272705078, -0.026444435119628906, -0.024617671966552734, -0.022790908813476562, -0.02096414566040039, -0.01913738250732422, -0.017310619354248047, -0.015483856201171875, -0.013657093048095703, -0.011830329895019531, -0.01000356674194336, -0.008176803588867188, -0.006350040435791016, -0.004523277282714844, -0.002696514129638672, -0.0008697509765625, 0.0009570121765136719, 0.0027837753295898438, 0.004610538482666016, 0.0064373016357421875, 0.00826406478881836, 0.010090827941894531, 0.011917591094970703, 0.013744354248046875, 0.015571117401123047, 0.01739788055419922, 0.01922464370727539, 0.021051406860351562, 0.022878170013427734, 0.024704933166503906, 0.026531696319580078, 0.02835845947265625, 0.030185222625732422, 0.032011985778808594, 0.033838748931884766, 0.03566551208496094, 0.03749227523803711, 0.03931903839111328, 0.04114580154418945, 0.042972564697265625, 0.0447993278503418, 0.04662609100341797, 0.04845285415649414, 0.05027961730957031, 0.052106380462646484, 0.053933143615722656, 0.05575990676879883, 0.057586669921875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 80.0, 939.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005784960929304361, -0.004382389597594738, -0.002979818033054471, -0.001577246468514204, -0.0001746751368045807, 0.0012278961949050426, 0.0026304679922759533, 0.004033038858324289, 0.0054356106556952, 0.006838181987404823, 0.008240753784775734, 0.009643325582146645, 0.01104589644819498, 0.012448467314243317, 0.013851039111614227, 0.015253610908985138, 0.01665618270635605, 0.01805875450372696, 0.01946132630109787, 0.02086389809846878, 0.022266468033194542, 0.023669039830565453, 0.025071611627936363, 0.026474181562662125, 0.027876753360033035, 0.029279325157403946, 0.030681896954774857, 0.03208446875214577, 0.03348704054951668, 0.03488960862159729, 0.0362921804189682, 0.03769475221633911, 0.03909732773900032, 0.04049989953637123, 0.04190247133374214, 0.04330504313111305, 0.04470761492848396, 0.046110183000564575, 0.047512754797935486, 0.048915326595306396, 0.05031789839267731, 0.05172047019004822, 0.05312304198741913, 0.05452561378479004, 0.05592818558216095, 0.05733075737953186, 0.05873332917690277, 0.06013589724898338, 0.06153847277164459, 0.0629410445690155, 0.06434361636638641, 0.06574618816375732, 0.06714875996112823, 0.06855133175849915, 0.06995390355587006, 0.07135647535324097, 0.07275903970003128, 0.07416161149740219, 0.0755641832947731, 0.07696675509214401, 0.07836932688951492, 0.07977189868688583, 0.08117447048425674, 0.08257704228162766, 0.08397961407899857]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 11.0, 9.0, 11.0, 13.0, 26.0, 32.0, 42.0, 39.0, 47.0, 48.0, 55.0, 65.0, 66.0, 67.0, 72.0, 77.0, 62.0, 63.0, 42.0, 26.0, 27.0, 31.0, 19.0, 17.0, 9.0, 14.0, 7.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0022071003913879395, -0.0021561840549111366, -0.002105267718434334, -0.002054351381957531, -0.002003435045480728, -0.0019525187090039253, -0.0019016023725271225, -0.0018506860360503197, -0.0017997696995735168, -0.001748853363096714, -0.0016979370266199112, -0.0016470206901431084, -0.0015961043536663055, -0.0015451880171895027, -0.0014942716807126999, -0.001443355344235897, -0.0013924390077590942, -0.0013415226712822914, -0.0012906063348054886, -0.0012396899983286858, -0.001188773661851883, -0.0011378573253750801, -0.0010869409888982773, -0.0010360246524214745, -0.0009851083159446716, -0.0009341919794678688, -0.000883275642991066, -0.0008323593065142632, -0.0007814429700374603, -0.0007305266335606575, -0.0006796102970838547, -0.0006286939606070518, -0.000577777624130249, -0.0005268612876534462, -0.00047594495117664337, -0.00042502861469984055, -0.0003741122782230377, -0.0003231959417462349, -0.00027227960526943207, -0.00022136326879262924, -0.00017044693231582642, -0.00011953059583902359, -6.861425936222076e-05, -1.7697922885417938e-05, 3.321841359138489e-05, 8.413475006818771e-05, 0.00013505108654499054, 0.00018596742302179337, 0.0002368837594985962, 0.000287800095975399, 0.00033871643245220184, 0.00038963276892900467, 0.0004405491054058075, 0.0004914654418826103, 0.0005423817783594131, 0.000593298114836216, 0.0006442144513130188, 0.0006951307877898216, 0.0007460471242666245, 0.0007969634607434273, 0.0008478797972202301, 0.0008987961336970329, 0.0009497124701738358, 0.0010006288066506386, 0.0010515451431274414]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 2.0, 6.0, 5.0, 5.0, 6.0, 8.0, 13.0, 14.0, 18.0, 19.0, 13.0, 17.0, 27.0, 23.0, 40.0, 31.0, 29.0, 32.0, 52.0, 44.0, 49.0, 49.0, 38.0, 49.0, 50.0, 41.0, 38.0, 40.0, 31.0, 34.0, 29.0, 33.0, 17.0, 22.0, 6.0, 18.0, 8.0, 14.0, 13.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.0625, -3.93463134765625, -3.8067626953125, -3.67889404296875, -3.551025390625, -3.42315673828125, -3.2952880859375, -3.16741943359375, -3.03955078125, -2.91168212890625, -2.7838134765625, -2.65594482421875, -2.528076171875, -2.40020751953125, -2.2723388671875, -2.14447021484375, -2.0166015625, -1.88873291015625, -1.7608642578125, -1.63299560546875, -1.505126953125, -1.37725830078125, -1.2493896484375, -1.12152099609375, -0.99365234375, -0.86578369140625, -0.7379150390625, -0.61004638671875, -0.482177734375, -0.35430908203125, -0.2264404296875, -0.09857177734375, 0.029296875, 0.15716552734375, 0.2850341796875, 0.41290283203125, 0.540771484375, 0.66864013671875, 0.7965087890625, 0.92437744140625, 1.05224609375, 1.18011474609375, 1.3079833984375, 1.43585205078125, 1.563720703125, 1.69158935546875, 1.8194580078125, 1.94732666015625, 2.0751953125, 2.20306396484375, 2.3309326171875, 2.45880126953125, 2.586669921875, 2.71453857421875, 2.8424072265625, 2.97027587890625, 3.09814453125, 3.22601318359375, 3.3538818359375, 3.48175048828125, 3.609619140625, 3.73748779296875, 3.8653564453125, 3.99322509765625, 4.12109375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 9.0, 2.0, 12.0, 7.0, 15.0, 18.0, 35.0, 24.0, 54.0, 78.0, 135.0, 183.0, 356.0, 539.0, 909.0, 1592.0, 2904.0, 5377.0, 9890.0, 21155.0, 47447.0, 122927.0, 320665.0, 309943.0, 116403.0, 45790.0, 20528.0, 9983.0, 4999.0, 2728.0, 1513.0, 920.0, 508.0, 303.0, 198.0, 140.0, 76.0, 61.0, 37.0, 34.0, 15.0, 14.0, 6.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5546875, -2.47479248046875, -2.3948974609375, -2.31500244140625, -2.235107421875, -2.15521240234375, -2.0753173828125, -1.99542236328125, -1.91552734375, -1.83563232421875, -1.7557373046875, -1.67584228515625, -1.595947265625, -1.51605224609375, -1.4361572265625, -1.35626220703125, -1.2763671875, -1.19647216796875, -1.1165771484375, -1.03668212890625, -0.956787109375, -0.87689208984375, -0.7969970703125, -0.71710205078125, -0.63720703125, -0.55731201171875, -0.4774169921875, -0.39752197265625, -0.317626953125, -0.23773193359375, -0.1578369140625, -0.07794189453125, 0.001953125, 0.08184814453125, 0.1617431640625, 0.24163818359375, 0.321533203125, 0.40142822265625, 0.4813232421875, 0.56121826171875, 0.64111328125, 0.72100830078125, 0.8009033203125, 0.88079833984375, 0.960693359375, 1.04058837890625, 1.1204833984375, 1.20037841796875, 1.2802734375, 1.36016845703125, 1.4400634765625, 1.51995849609375, 1.599853515625, 1.67974853515625, 1.7596435546875, 1.83953857421875, 1.91943359375, 1.99932861328125, 2.0792236328125, 2.15911865234375, 2.239013671875, 2.31890869140625, 2.3988037109375, 2.47869873046875, 2.55859375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 1.0, 5.0, 5.0, 9.0, 19.0, 12.0, 18.0, 22.0, 30.0, 27.0, 28.0, 37.0, 39.0, 44.0, 37.0, 44.0, 53.0, 73.0, 236.0, 1699.0, 140.0, 63.0, 60.0, 54.0, 41.0, 36.0, 32.0, 22.0, 24.0, 21.0, 20.0, 25.0, 16.0, 14.0, 6.0, 6.0, 10.0, 10.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.421875, -13.9615478515625, -13.501220703125, -13.0408935546875, -12.58056640625, -12.1202392578125, -11.659912109375, -11.1995849609375, -10.7392578125, -10.2789306640625, -9.818603515625, -9.3582763671875, -8.89794921875, -8.4376220703125, -7.977294921875, -7.5169677734375, -7.056640625, -6.5963134765625, -6.135986328125, -5.6756591796875, -5.21533203125, -4.7550048828125, -4.294677734375, -3.8343505859375, -3.3740234375, -2.9136962890625, -2.453369140625, -1.9930419921875, -1.53271484375, -1.0723876953125, -0.612060546875, -0.1517333984375, 0.30859375, 0.7689208984375, 1.229248046875, 1.6895751953125, 2.14990234375, 2.6102294921875, 3.070556640625, 3.5308837890625, 3.9912109375, 4.4515380859375, 4.911865234375, 5.3721923828125, 5.83251953125, 6.2928466796875, 6.753173828125, 7.2135009765625, 7.673828125, 8.1341552734375, 8.594482421875, 9.0548095703125, 9.51513671875, 9.9754638671875, 10.435791015625, 10.8961181640625, 11.3564453125, 11.8167724609375, 12.277099609375, 12.7374267578125, 13.19775390625, 13.6580810546875, 14.118408203125, 14.5787353515625, 15.0390625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 11.0, 5.0, 12.0, 13.0, 24.0, 25.0, 21.0, 34.0, 31.0, 50.0, 83.0, 132.0, 185.0, 299.0, 672.0, 3459.0, 207884.0, 2920189.0, 10299.0, 1104.0, 402.0, 210.0, 151.0, 87.0, 62.0, 53.0, 27.0, 47.0, 23.0, 25.0, 17.0, 17.0, 12.0, 11.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.65625, -23.890380859375, -23.12451171875, -22.358642578125, -21.5927734375, -20.826904296875, -20.06103515625, -19.295166015625, -18.529296875, -17.763427734375, -16.99755859375, -16.231689453125, -15.4658203125, -14.699951171875, -13.93408203125, -13.168212890625, -12.40234375, -11.636474609375, -10.87060546875, -10.104736328125, -9.3388671875, -8.572998046875, -7.80712890625, -7.041259765625, -6.275390625, -5.509521484375, -4.74365234375, -3.977783203125, -3.2119140625, -2.446044921875, -1.68017578125, -0.914306640625, -0.1484375, 0.617431640625, 1.38330078125, 2.149169921875, 2.9150390625, 3.680908203125, 4.44677734375, 5.212646484375, 5.978515625, 6.744384765625, 7.51025390625, 8.276123046875, 9.0419921875, 9.807861328125, 10.57373046875, 11.339599609375, 12.10546875, 12.871337890625, 13.63720703125, 14.403076171875, 15.1689453125, 15.934814453125, 16.70068359375, 17.466552734375, 18.232421875, 18.998291015625, 19.76416015625, 20.530029296875, 21.2958984375, 22.061767578125, 22.82763671875, 23.593505859375, 24.359375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 7.0, 330.0, 642.0, 35.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.857102394104004, -7.4332780838012695, -4.009453773498535, -0.5856294631958008, 2.8381948471069336, 6.262019157409668, 9.685843467712402, 13.109667778015137, 16.533493041992188, 19.957317352294922, 23.381141662597656, 26.80496597290039, 30.228790283203125, 33.65261459350586, 37.076438903808594, 40.50026321411133, 43.92408752441406, 47.3479118347168, 50.77173614501953, 54.195560455322266, 57.619384765625, 61.043209075927734, 64.46703338623047, 67.89085388183594, 71.31468200683594, 74.73851013183594, 78.1623306274414, 81.58615112304688, 85.00997924804688, 88.43380737304688, 91.85762786865234, 95.28144836425781, 98.70527648925781, 102.12910461425781, 105.55292510986328, 108.97674560546875, 112.40057373046875, 115.82440185546875, 119.24822235107422, 122.67204284667969, 126.09587097167969, 129.5196990966797, 132.94351196289062, 136.36734008789062, 139.79116821289062, 143.21499633789062, 146.63882446289062, 150.06263732910156, 153.48646545410156, 156.91029357910156, 160.3341064453125, 163.7579345703125, 167.1817626953125, 170.6055908203125, 174.0294189453125, 177.45323181152344, 180.87705993652344, 184.30088806152344, 187.72470092773438, 191.14852905273438, 194.57235717773438, 197.99618530273438, 201.42001342773438, 204.8438262939453, 208.2676544189453]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 10.0, 7.0, 11.0, 13.0, 11.0, 12.0, 17.0, 23.0, 14.0, 27.0, 22.0, 21.0, 41.0, 27.0, 36.0, 39.0, 43.0, 42.0, 41.0, 45.0, 35.0, 48.0, 33.0, 42.0, 31.0, 36.0, 26.0, 34.0, 26.0, 29.0, 29.0, 15.0, 14.0, 12.0, 14.0, 15.0, 12.0, 7.0, 10.0, 6.0, 9.0, 5.0, 3.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.402992248535156, -45.00642395019531, -43.6098518371582, -42.21328353881836, -40.816715240478516, -39.420143127441406, -38.02357482910156, -36.62700653076172, -35.230438232421875, -33.83386993408203, -32.43729782104492, -31.040729522705078, -29.644161224365234, -28.247591018676758, -26.85102081298828, -25.454452514648438, -24.057880401611328, -22.66131019592285, -21.264741897583008, -19.86817169189453, -18.471603393554688, -17.07503318786621, -15.678462982177734, -14.281893730163574, -12.885324478149414, -11.488755226135254, -10.092185974121094, -8.695615768432617, -7.299046516418457, -5.902477264404297, -4.50590705871582, -3.10933780670166, -1.7127685546875, -0.31619906425476074, 1.0803704261779785, 2.476940155029297, 3.873509407043457, 5.270078659057617, 6.666648864746094, 8.063218116760254, 9.459787368774414, 10.856356620788574, 12.252925872802734, 13.649496078491211, 15.046065330505371, 16.44263458251953, 17.839204788208008, 19.235774993896484, 20.632343292236328, 22.028913497924805, 23.42548179626465, 24.822052001953125, 26.21862030029297, 27.615190505981445, 29.011760711669922, 30.408329010009766, 31.804899215698242, 33.20146942138672, 34.59803771972656, 35.994606018066406, 37.391178131103516, 38.78774642944336, 40.18431854248047, 41.58088684082031, 42.977455139160156]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 6.0, 5.0, 7.0, 6.0, 10.0, 7.0, 12.0, 21.0, 14.0, 23.0, 22.0, 21.0, 24.0, 26.0, 31.0, 43.0, 40.0, 34.0, 38.0, 47.0, 42.0, 49.0, 42.0, 48.0, 35.0, 39.0, 44.0, 29.0, 40.0, 36.0, 29.0, 18.0, 19.0, 15.0, 17.0, 11.0, 9.0, 15.0, 5.0, 6.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.984375, -3.8560791015625, -3.727783203125, -3.5994873046875, -3.47119140625, -3.3428955078125, -3.214599609375, -3.0863037109375, -2.9580078125, -2.8297119140625, -2.701416015625, -2.5731201171875, -2.44482421875, -2.3165283203125, -2.188232421875, -2.0599365234375, -1.931640625, -1.8033447265625, -1.675048828125, -1.5467529296875, -1.41845703125, -1.2901611328125, -1.161865234375, -1.0335693359375, -0.9052734375, -0.7769775390625, -0.648681640625, -0.5203857421875, -0.39208984375, -0.2637939453125, -0.135498046875, -0.0072021484375, 0.12109375, 0.2493896484375, 0.377685546875, 0.5059814453125, 0.63427734375, 0.7625732421875, 0.890869140625, 1.0191650390625, 1.1474609375, 1.2757568359375, 1.404052734375, 1.5323486328125, 1.66064453125, 1.7889404296875, 1.917236328125, 2.0455322265625, 2.173828125, 2.3021240234375, 2.430419921875, 2.5587158203125, 2.68701171875, 2.8153076171875, 2.943603515625, 3.0718994140625, 3.2001953125, 3.3284912109375, 3.456787109375, 3.5850830078125, 3.71337890625, 3.8416748046875, 3.969970703125, 4.0982666015625, 4.2265625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 9.0, 7.0, 8.0, 6.0, 11.0, 12.0, 20.0, 18.0, 28.0, 36.0, 42.0, 48.0, 96.0, 196.0, 458.0, 1461.0, 6701.0, 40312.0, 499362.0, 3050256.0, 543206.0, 42409.0, 6941.0, 1546.0, 508.0, 205.0, 96.0, 74.0, 38.0, 35.0, 34.0, 28.0, 17.0, 13.0, 7.0, 8.0, 8.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.890625, -12.494140625, -12.09765625, -11.701171875, -11.3046875, -10.908203125, -10.51171875, -10.115234375, -9.71875, -9.322265625, -8.92578125, -8.529296875, -8.1328125, -7.736328125, -7.33984375, -6.943359375, -6.546875, -6.150390625, -5.75390625, -5.357421875, -4.9609375, -4.564453125, -4.16796875, -3.771484375, -3.375, -2.978515625, -2.58203125, -2.185546875, -1.7890625, -1.392578125, -0.99609375, -0.599609375, -0.203125, 0.193359375, 0.58984375, 0.986328125, 1.3828125, 1.779296875, 2.17578125, 2.572265625, 2.96875, 3.365234375, 3.76171875, 4.158203125, 4.5546875, 4.951171875, 5.34765625, 5.744140625, 6.140625, 6.537109375, 6.93359375, 7.330078125, 7.7265625, 8.123046875, 8.51953125, 8.916015625, 9.3125, 9.708984375, 10.10546875, 10.501953125, 10.8984375, 11.294921875, 11.69140625, 12.087890625, 12.484375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 3.0, 10.0, 16.0, 15.0, 41.0, 54.0, 85.0, 121.0, 185.0, 301.0, 388.0, 592.0, 662.0, 529.0, 366.0, 248.0, 166.0, 110.0, 55.0, 47.0, 28.0, 15.0, 14.0, 9.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.46875, -13.974365234375, -13.47998046875, -12.985595703125, -12.4912109375, -11.996826171875, -11.50244140625, -11.008056640625, -10.513671875, -10.019287109375, -9.52490234375, -9.030517578125, -8.5361328125, -8.041748046875, -7.54736328125, -7.052978515625, -6.55859375, -6.064208984375, -5.56982421875, -5.075439453125, -4.5810546875, -4.086669921875, -3.59228515625, -3.097900390625, -2.603515625, -2.109130859375, -1.61474609375, -1.120361328125, -0.6259765625, -0.131591796875, 0.36279296875, 0.857177734375, 1.3515625, 1.845947265625, 2.34033203125, 2.834716796875, 3.3291015625, 3.823486328125, 4.31787109375, 4.812255859375, 5.306640625, 5.801025390625, 6.29541015625, 6.789794921875, 7.2841796875, 7.778564453125, 8.27294921875, 8.767333984375, 9.26171875, 9.756103515625, 10.25048828125, 10.744873046875, 11.2392578125, 11.733642578125, 12.22802734375, 12.722412109375, 13.216796875, 13.711181640625, 14.20556640625, 14.699951171875, 15.1943359375, 15.688720703125, 16.18310546875, 16.677490234375, 17.171875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 4.0, 14.0, 11.0, 18.0, 25.0, 31.0, 40.0, 65.0, 81.0, 109.0, 152.0, 281.0, 484.0, 1401.0, 9460.0, 355110.0, 3735260.0, 85421.0, 4204.0, 959.0, 402.0, 204.0, 145.0, 100.0, 86.0, 49.0, 40.0, 30.0, 20.0, 15.0, 10.0, 10.0, 10.0, 10.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.03125, -31.9052734375, -30.779296875, -29.6533203125, -28.52734375, -27.4013671875, -26.275390625, -25.1494140625, -24.0234375, -22.8974609375, -21.771484375, -20.6455078125, -19.51953125, -18.3935546875, -17.267578125, -16.1416015625, -15.015625, -13.8896484375, -12.763671875, -11.6376953125, -10.51171875, -9.3857421875, -8.259765625, -7.1337890625, -6.0078125, -4.8818359375, -3.755859375, -2.6298828125, -1.50390625, -0.3779296875, 0.748046875, 1.8740234375, 3.0, 4.1259765625, 5.251953125, 6.3779296875, 7.50390625, 8.6298828125, 9.755859375, 10.8818359375, 12.0078125, 13.1337890625, 14.259765625, 15.3857421875, 16.51171875, 17.6376953125, 18.763671875, 19.8896484375, 21.015625, 22.1416015625, 23.267578125, 24.3935546875, 25.51953125, 26.6455078125, 27.771484375, 28.8974609375, 30.0234375, 31.1494140625, 32.275390625, 33.4013671875, 34.52734375, 35.6533203125, 36.779296875, 37.9052734375, 39.03125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 15.0, 21.0, 48.0, 80.0, 110.0, 127.0, 148.0, 139.0, 104.0, 91.0, 49.0, 32.0, 22.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.87782287597656, -66.0169448852539, -64.15605926513672, -62.29518127441406, -60.43429946899414, -58.57341766357422, -56.71253967285156, -54.85165786743164, -52.99077606201172, -51.1298942565918, -49.269012451171875, -47.40813446044922, -45.5472526550293, -43.686370849609375, -41.82549285888672, -39.9646110534668, -38.103729248046875, -36.24284744262695, -34.38196563720703, -32.521087646484375, -30.660205841064453, -28.79932403564453, -26.938444137573242, -25.077564239501953, -23.21668243408203, -21.35580062866211, -19.49492073059082, -17.63404083251953, -15.77315902709961, -13.912278175354004, -12.051397323608398, -10.190516471862793, -8.329639434814453, -6.468758583068848, -4.607877731323242, -2.7469968795776367, -0.8861160278320312, 0.9747648239135742, 2.8356456756591797, 4.696526527404785, 6.557407379150391, 8.418288230895996, 10.279169082641602, 12.140049934387207, 14.000930786132812, 15.861811637878418, 17.722692489624023, 19.583572387695312, 21.444454193115234, 23.305335998535156, 25.166215896606445, 27.027095794677734, 28.887977600097656, 30.748859405517578, 32.6097412109375, 34.470619201660156, 36.33150100708008, 38.1923828125, 40.053260803222656, 41.91414260864258, 43.7750244140625, 45.63590621948242, 47.496788024902344, 49.357666015625, 51.21854782104492]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 11.0, 2.0, 9.0, 5.0, 7.0, 7.0, 10.0, 13.0, 13.0, 25.0, 20.0, 24.0, 18.0, 26.0, 34.0, 35.0, 34.0, 32.0, 34.0, 45.0, 45.0, 42.0, 36.0, 32.0, 37.0, 37.0, 40.0, 45.0, 38.0, 34.0, 26.0, 28.0, 25.0, 24.0, 19.0, 10.0, 14.0, 12.0, 6.0, 12.0, 6.0, 9.0, 4.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-37.75487518310547, -36.618038177490234, -35.481201171875, -34.344364166259766, -33.20752716064453, -32.07068634033203, -30.933849334716797, -29.797012329101562, -28.660175323486328, -27.523338317871094, -26.38650131225586, -25.249662399291992, -24.112825393676758, -22.975988388061523, -21.839149475097656, -20.702312469482422, -19.565475463867188, -18.428638458251953, -17.29180145263672, -16.15496253967285, -15.018125534057617, -13.881288528442383, -12.744450569152832, -11.607612609863281, -10.470775604248047, -9.333938598632812, -8.197100639343262, -7.060263156890869, -5.923425674438477, -4.786588191986084, -3.6497507095336914, -2.512913227081299, -1.3760719299316406, -0.23923444747924805, 0.8976030349731445, 2.034440517425537, 3.1712779998779297, 4.308115482330322, 5.444952964782715, 6.581790447235107, 7.7186279296875, 8.855464935302734, 9.992302894592285, 11.129140853881836, 12.26597785949707, 13.402814865112305, 14.539652824401855, 15.676490783691406, 16.81332778930664, 17.950164794921875, 19.08700180053711, 20.223840713500977, 21.36067771911621, 22.497514724731445, 23.634353637695312, 24.771190643310547, 25.90802764892578, 27.044864654541016, 28.18170166015625, 29.318540573120117, 30.45537757873535, 31.592214584350586, 32.72905349731445, 33.86589050292969, 35.00272750854492]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 2.0, 3.0, 9.0, 7.0, 3.0, 14.0, 12.0, 13.0, 15.0, 16.0, 27.0, 30.0, 37.0, 18.0, 31.0, 31.0, 38.0, 36.0, 49.0, 32.0, 24.0, 44.0, 39.0, 41.0, 44.0, 39.0, 42.0, 35.0, 35.0, 25.0, 27.0, 32.0, 14.0, 18.0, 21.0, 15.0, 17.0, 14.0, 9.0, 7.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-3.7734375, -3.6500244140625, -3.526611328125, -3.4031982421875, -3.27978515625, -3.1563720703125, -3.032958984375, -2.9095458984375, -2.7861328125, -2.6627197265625, -2.539306640625, -2.4158935546875, -2.29248046875, -2.1690673828125, -2.045654296875, -1.9222412109375, -1.798828125, -1.6754150390625, -1.552001953125, -1.4285888671875, -1.30517578125, -1.1817626953125, -1.058349609375, -0.9349365234375, -0.8115234375, -0.6881103515625, -0.564697265625, -0.4412841796875, -0.31787109375, -0.1944580078125, -0.071044921875, 0.0523681640625, 0.17578125, 0.2991943359375, 0.422607421875, 0.5460205078125, 0.66943359375, 0.7928466796875, 0.916259765625, 1.0396728515625, 1.1630859375, 1.2864990234375, 1.409912109375, 1.5333251953125, 1.65673828125, 1.7801513671875, 1.903564453125, 2.0269775390625, 2.150390625, 2.2738037109375, 2.397216796875, 2.5206298828125, 2.64404296875, 2.7674560546875, 2.890869140625, 3.0142822265625, 3.1376953125, 3.2611083984375, 3.384521484375, 3.5079345703125, 3.63134765625, 3.7547607421875, 3.878173828125, 4.0015869140625, 4.125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 9.0, 7.0, 17.0, 18.0, 32.0, 50.0, 61.0, 95.0, 157.0, 211.0, 340.0, 504.0, 783.0, 1251.0, 2034.0, 3090.0, 4983.0, 8004.0, 12731.0, 20690.0, 34590.0, 60725.0, 116437.0, 220953.0, 247929.0, 138780.0, 71922.0, 39796.0, 23511.0, 14461.0, 9010.0, 5564.0, 3608.0, 2277.0, 1375.0, 909.0, 558.0, 351.0, 243.0, 155.0, 102.0, 66.0, 62.0, 35.0, 17.0, 16.0, 11.0, 9.0, 9.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0], "bins": [-0.6591796875, -0.6386642456054688, -0.6181488037109375, -0.5976333618164062, -0.577117919921875, -0.5566024780273438, -0.5360870361328125, -0.5155715942382812, -0.49505615234375, -0.47454071044921875, -0.4540252685546875, -0.43350982666015625, -0.412994384765625, -0.39247894287109375, -0.3719635009765625, -0.35144805908203125, -0.3309326171875, -0.31041717529296875, -0.2899017333984375, -0.26938629150390625, -0.248870849609375, -0.22835540771484375, -0.2078399658203125, -0.18732452392578125, -0.16680908203125, -0.14629364013671875, -0.1257781982421875, -0.10526275634765625, -0.084747314453125, -0.06423187255859375, -0.0437164306640625, -0.02320098876953125, -0.002685546875, 0.01782989501953125, 0.0383453369140625, 0.05886077880859375, 0.079376220703125, 0.09989166259765625, 0.1204071044921875, 0.14092254638671875, 0.16143798828125, 0.18195343017578125, 0.2024688720703125, 0.22298431396484375, 0.243499755859375, 0.26401519775390625, 0.2845306396484375, 0.30504608154296875, 0.3255615234375, 0.34607696533203125, 0.3665924072265625, 0.38710784912109375, 0.407623291015625, 0.42813873291015625, 0.4486541748046875, 0.46916961669921875, 0.48968505859375, 0.5102005004882812, 0.5307159423828125, 0.5512313842773438, 0.571746826171875, 0.5922622680664062, 0.6127777099609375, 0.6332931518554688, 0.65380859375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 12.0, 10.0, 14.0, 15.0, 22.0, 20.0, 27.0, 35.0, 29.0, 25.0, 36.0, 35.0, 32.0, 47.0, 38.0, 46.0, 44.0, 1074.0, 51.0, 40.0, 38.0, 30.0, 32.0, 39.0, 24.0, 24.0, 24.0, 23.0, 22.0, 17.0, 21.0, 18.0, 12.0, 7.0, 14.0, 10.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.703125, -2.61761474609375, -2.5321044921875, -2.44659423828125, -2.361083984375, -2.27557373046875, -2.1900634765625, -2.10455322265625, -2.01904296875, -1.93353271484375, -1.8480224609375, -1.76251220703125, -1.677001953125, -1.59149169921875, -1.5059814453125, -1.42047119140625, -1.3349609375, -1.24945068359375, -1.1639404296875, -1.07843017578125, -0.992919921875, -0.90740966796875, -0.8218994140625, -0.73638916015625, -0.65087890625, -0.56536865234375, -0.4798583984375, -0.39434814453125, -0.308837890625, -0.22332763671875, -0.1378173828125, -0.05230712890625, 0.033203125, 0.11871337890625, 0.2042236328125, 0.28973388671875, 0.375244140625, 0.46075439453125, 0.5462646484375, 0.63177490234375, 0.71728515625, 0.80279541015625, 0.8883056640625, 0.97381591796875, 1.059326171875, 1.14483642578125, 1.2303466796875, 1.31585693359375, 1.4013671875, 1.48687744140625, 1.5723876953125, 1.65789794921875, 1.743408203125, 1.82891845703125, 1.9144287109375, 1.99993896484375, 2.08544921875, 2.17095947265625, 2.2564697265625, 2.34197998046875, 2.427490234375, 2.51300048828125, 2.5985107421875, 2.68402099609375, 2.76953125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 14.0, 17.0, 15.0, 23.0, 50.0, 88.0, 123.0, 186.0, 260.0, 460.0, 639.0, 1136.0, 1865.0, 2957.0, 4740.0, 8229.0, 14020.0, 24567.0, 44494.0, 82109.0, 150275.0, 1280807.0, 208124.0, 120739.0, 66204.0, 36189.0, 20022.0, 11507.0, 6784.0, 3896.0, 2558.0, 1496.0, 970.0, 566.0, 355.0, 241.0, 150.0, 86.0, 49.0, 47.0, 31.0, 18.0, 6.0, 7.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.47607421875, -0.46111297607421875, -0.4461517333984375, -0.43119049072265625, -0.416229248046875, -0.40126800537109375, -0.3863067626953125, -0.37134552001953125, -0.35638427734375, -0.34142303466796875, -0.3264617919921875, -0.31150054931640625, -0.296539306640625, -0.28157806396484375, -0.2666168212890625, -0.25165557861328125, -0.2366943359375, -0.22173309326171875, -0.2067718505859375, -0.19181060791015625, -0.176849365234375, -0.16188812255859375, -0.1469268798828125, -0.13196563720703125, -0.11700439453125, -0.10204315185546875, -0.0870819091796875, -0.07212066650390625, -0.057159423828125, -0.04219818115234375, -0.0272369384765625, -0.01227569580078125, 0.002685546875, 0.01764678955078125, 0.0326080322265625, 0.04756927490234375, 0.062530517578125, 0.07749176025390625, 0.0924530029296875, 0.10741424560546875, 0.12237548828125, 0.13733673095703125, 0.1522979736328125, 0.16725921630859375, 0.182220458984375, 0.19718170166015625, 0.2121429443359375, 0.22710418701171875, 0.2420654296875, 0.25702667236328125, 0.2719879150390625, 0.28694915771484375, 0.301910400390625, 0.31687164306640625, 0.3318328857421875, 0.34679412841796875, 0.36175537109375, 0.37671661376953125, 0.3916778564453125, 0.40663909912109375, 0.421600341796875, 0.43656158447265625, 0.4515228271484375, 0.46648406982421875, 0.4814453125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 6.0, 11.0, 13.0, 10.0, 10.0, 19.0, 19.0, 19.0, 26.0, 27.0, 27.0, 35.0, 26.0, 52.0, 49.0, 46.0, 57.0, 48.0, 59.0, 50.0, 57.0, 37.0, 48.0, 47.0, 29.0, 32.0, 23.0, 23.0, 22.0, 14.0, 12.0, 9.0, 7.0, 5.0, 11.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001453399658203125, -0.0014071613550186157, -0.0013609230518341064, -0.0013146847486495972, -0.0012684464454650879, -0.0012222081422805786, -0.0011759698390960693, -0.00112973153591156, -0.0010834932327270508, -0.0010372549295425415, -0.0009910166263580322, -0.000944778323173523, -0.0008985400199890137, -0.0008523017168045044, -0.0008060634136199951, -0.0007598251104354858, -0.0007135868072509766, -0.0006673485040664673, -0.000621110200881958, -0.0005748718976974487, -0.0005286335945129395, -0.0004823952913284302, -0.0004361569881439209, -0.0003899186849594116, -0.00034368038177490234, -0.00029744207859039307, -0.0002512037754058838, -0.0002049654722213745, -0.00015872716903686523, -0.00011248886585235596, -6.625056266784668e-05, -2.0012259483337402e-05, 2.6226043701171875e-05, 7.246434688568115e-05, 0.00011870265007019043, 0.0001649409532546997, 0.00021117925643920898, 0.00025741755962371826, 0.00030365586280822754, 0.0003498941659927368, 0.0003961324691772461, 0.00044237077236175537, 0.0004886090755462646, 0.0005348473787307739, 0.0005810856819152832, 0.0006273239850997925, 0.0006735622882843018, 0.000719800591468811, 0.0007660388946533203, 0.0008122771978378296, 0.0008585155010223389, 0.0009047538042068481, 0.0009509921073913574, 0.0009972304105758667, 0.001043468713760376, 0.0010897070169448853, 0.0011359453201293945, 0.0011821836233139038, 0.001228421926498413, 0.0012746602296829224, 0.0013208985328674316, 0.001367136836051941, 0.0014133751392364502, 0.0014596134424209595, 0.0015058517456054688]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 1.0, 7.0, 9.0, 14.0, 18.0, 17.0, 21.0, 40.0, 53.0, 75.0, 121.0, 251.0, 613.0, 7625.0, 1035418.0, 3174.0, 521.0, 217.0, 105.0, 62.0, 50.0, 36.0, 18.0, 15.0, 20.0, 11.0, 10.0, 12.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05255126953125, -0.05087900161743164, -0.04920673370361328, -0.04753446578979492, -0.04586219787597656, -0.0441899299621582, -0.042517662048339844, -0.040845394134521484, -0.039173126220703125, -0.037500858306884766, -0.035828590393066406, -0.03415632247924805, -0.03248405456542969, -0.030811786651611328, -0.02913951873779297, -0.02746725082397461, -0.02579498291015625, -0.02412271499633789, -0.02245044708251953, -0.020778179168701172, -0.019105911254882812, -0.017433643341064453, -0.015761375427246094, -0.014089107513427734, -0.012416839599609375, -0.010744571685791016, -0.009072303771972656, -0.007400035858154297, -0.0057277679443359375, -0.004055500030517578, -0.0023832321166992188, -0.0007109642028808594, 0.0009613037109375, 0.0026335716247558594, 0.004305839538574219, 0.005978107452392578, 0.0076503753662109375, 0.009322643280029297, 0.010994911193847656, 0.012667179107666016, 0.014339447021484375, 0.016011714935302734, 0.017683982849121094, 0.019356250762939453, 0.021028518676757812, 0.022700786590576172, 0.02437305450439453, 0.02604532241821289, 0.02771759033203125, 0.02938985824584961, 0.03106212615966797, 0.03273439407348633, 0.03440666198730469, 0.03607892990112305, 0.037751197814941406, 0.039423465728759766, 0.041095733642578125, 0.042768001556396484, 0.044440269470214844, 0.0461125373840332, 0.04778480529785156, 0.04945707321166992, 0.05112934112548828, 0.05280160903930664, 0.054473876953125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1017.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0044039469212293625, -0.003146381815895438, -0.001888816710561514, -0.0006312516052275896, 0.0006263135001063347, 0.0018838783726096153, 0.0031414437107741833, 0.004399009048938751, 0.005656573921442032, 0.0069141387939453125, 0.008171703666448593, 0.009429269470274448, 0.010686834342777729, 0.01194439921528101, 0.013201965019106865, 0.014459529891610146, 0.015717094764113426, 0.016974659636616707, 0.018232224509119987, 0.019489789381623268, 0.020747356116771698, 0.02200492098927498, 0.02326248586177826, 0.02452005073428154, 0.02577761560678482, 0.0270351804792881, 0.028292745351791382, 0.029550310224294662, 0.030807875096797943, 0.032065439969301224, 0.033323004841804504, 0.034580573439598083, 0.035838134586811066, 0.037095699459314346, 0.03835326433181763, 0.03961082920432091, 0.04086839407682419, 0.04212595894932747, 0.04338352382183075, 0.04464109241962433, 0.04589865356683731, 0.04715621843934059, 0.04841378331184387, 0.04967134818434715, 0.05092891305685043, 0.052186477929353714, 0.053444042801856995, 0.054701611399650574, 0.055959176272153854, 0.057216741144657135, 0.058474306017160416, 0.059731870889663696, 0.06098943576216698, 0.06224700063467026, 0.06350456923246384, 0.06476213037967682, 0.0660196989774704, 0.06727726757526398, 0.06853482872247696, 0.06979239732027054, 0.07104995846748352, 0.0723075270652771, 0.07356508821249008, 0.07482265681028366, 0.07608021795749664]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 20.0, 24.0, 28.0, 35.0, 44.0, 62.0, 61.0, 63.0, 74.0, 73.0, 73.0, 78.0, 61.0, 64.0, 58.0, 43.0, 40.0, 22.0, 25.0, 21.0, 9.0, 3.0, 11.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019169449806213379, -0.0018700174987316132, -0.0018230900168418884, -0.0017761625349521637, -0.001729235053062439, -0.0016823075711727142, -0.0016353800892829895, -0.0015884526073932648, -0.00154152512550354, -0.0014945976436138153, -0.0014476701617240906, -0.0014007426798343658, -0.0013538151979446411, -0.0013068877160549164, -0.0012599602341651917, -0.001213032752275467, -0.0011661052703857422, -0.0011191777884960175, -0.0010722503066062927, -0.001025322824716568, -0.0009783953428268433, -0.0009314678609371185, -0.0008845403790473938, -0.0008376128971576691, -0.0007906854152679443, -0.0007437579333782196, -0.0006968304514884949, -0.0006499029695987701, -0.0006029754877090454, -0.0005560480058193207, -0.000509120523929596, -0.0004621930420398712, -0.0004152655601501465, -0.00036833807826042175, -0.000321410596370697, -0.0002744831144809723, -0.00022755563259124756, -0.00018062815070152283, -0.0001337006688117981, -8.677318692207336e-05, -3.984570503234863e-05, 7.081776857376099e-06, 5.400925874710083e-05, 0.00010093674063682556, 0.0001478642225265503, 0.00019479170441627502, 0.00024171918630599976, 0.0002886466681957245, 0.0003355741500854492, 0.00038250163197517395, 0.0004294291138648987, 0.0004763565957546234, 0.0005232840776443481, 0.0005702115595340729, 0.0006171390414237976, 0.0006640665233135223, 0.0007109940052032471, 0.0007579214870929718, 0.0008048489689826965, 0.0008517764508724213, 0.000898703932762146, 0.0009456314146518707, 0.0009925588965415955, 0.0010394863784313202, 0.001086413860321045]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 2.0, 3.0, 9.0, 7.0, 3.0, 14.0, 12.0, 13.0, 15.0, 16.0, 27.0, 30.0, 37.0, 18.0, 31.0, 31.0, 38.0, 36.0, 49.0, 32.0, 24.0, 44.0, 39.0, 41.0, 44.0, 39.0, 42.0, 35.0, 35.0, 25.0, 27.0, 32.0, 14.0, 17.0, 22.0, 15.0, 17.0, 14.0, 9.0, 7.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-3.7734375, -3.6500244140625, -3.526611328125, -3.4031982421875, -3.27978515625, -3.1563720703125, -3.032958984375, -2.9095458984375, -2.7861328125, -2.6627197265625, -2.539306640625, -2.4158935546875, -2.29248046875, -2.1690673828125, -2.045654296875, -1.9222412109375, -1.798828125, -1.6754150390625, -1.552001953125, -1.4285888671875, -1.30517578125, -1.1817626953125, -1.058349609375, -0.9349365234375, -0.8115234375, -0.6881103515625, -0.564697265625, -0.4412841796875, -0.31787109375, -0.1944580078125, -0.071044921875, 0.0523681640625, 0.17578125, 0.2991943359375, 0.422607421875, 0.5460205078125, 0.66943359375, 0.7928466796875, 0.916259765625, 1.0396728515625, 1.1630859375, 1.2864990234375, 1.409912109375, 1.5333251953125, 1.65673828125, 1.7801513671875, 1.903564453125, 2.0269775390625, 2.150390625, 2.2738037109375, 2.397216796875, 2.5206298828125, 2.64404296875, 2.7674560546875, 2.890869140625, 3.0142822265625, 3.1376953125, 3.2611083984375, 3.384521484375, 3.5079345703125, 3.63134765625, 3.7547607421875, 3.878173828125, 4.0015869140625, 4.125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 6.0, 16.0, 21.0, 23.0, 43.0, 55.0, 91.0, 141.0, 214.0, 255.0, 449.0, 705.0, 1098.0, 1946.0, 3126.0, 5928.0, 11776.0, 26368.0, 71488.0, 283443.0, 472455.0, 102319.0, 34697.0, 14904.0, 7298.0, 3746.0, 2153.0, 1305.0, 834.0, 558.0, 362.0, 214.0, 167.0, 94.0, 75.0, 58.0, 27.0, 22.0, 24.0, 9.0, 13.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.6015625, -4.4627685546875, -4.323974609375, -4.1851806640625, -4.04638671875, -3.9075927734375, -3.768798828125, -3.6300048828125, -3.4912109375, -3.3524169921875, -3.213623046875, -3.0748291015625, -2.93603515625, -2.7972412109375, -2.658447265625, -2.5196533203125, -2.380859375, -2.2420654296875, -2.103271484375, -1.9644775390625, -1.82568359375, -1.6868896484375, -1.548095703125, -1.4093017578125, -1.2705078125, -1.1317138671875, -0.992919921875, -0.8541259765625, -0.71533203125, -0.5765380859375, -0.437744140625, -0.2989501953125, -0.16015625, -0.0213623046875, 0.117431640625, 0.2562255859375, 0.39501953125, 0.5338134765625, 0.672607421875, 0.8114013671875, 0.9501953125, 1.0889892578125, 1.227783203125, 1.3665771484375, 1.50537109375, 1.6441650390625, 1.782958984375, 1.9217529296875, 2.060546875, 2.1993408203125, 2.338134765625, 2.4769287109375, 2.61572265625, 2.7545166015625, 2.893310546875, 3.0321044921875, 3.1708984375, 3.3096923828125, 3.448486328125, 3.5872802734375, 3.72607421875, 3.8648681640625, 4.003662109375, 4.1424560546875, 4.28125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 3.0, 7.0, 9.0, 10.0, 8.0, 14.0, 10.0, 18.0, 21.0, 24.0, 30.0, 36.0, 38.0, 43.0, 42.0, 43.0, 66.0, 106.0, 426.0, 1516.0, 112.0, 65.0, 51.0, 41.0, 40.0, 38.0, 38.0, 28.0, 22.0, 20.0, 15.0, 21.0, 16.0, 17.0, 8.0, 11.0, 8.0, 7.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4375, -14.9842529296875, -14.531005859375, -14.0777587890625, -13.62451171875, -13.1712646484375, -12.718017578125, -12.2647705078125, -11.8115234375, -11.3582763671875, -10.905029296875, -10.4517822265625, -9.99853515625, -9.5452880859375, -9.092041015625, -8.6387939453125, -8.185546875, -7.7322998046875, -7.279052734375, -6.8258056640625, -6.37255859375, -5.9193115234375, -5.466064453125, -5.0128173828125, -4.5595703125, -4.1063232421875, -3.653076171875, -3.1998291015625, -2.74658203125, -2.2933349609375, -1.840087890625, -1.3868408203125, -0.93359375, -0.4803466796875, -0.027099609375, 0.4261474609375, 0.87939453125, 1.3326416015625, 1.785888671875, 2.2391357421875, 2.6923828125, 3.1456298828125, 3.598876953125, 4.0521240234375, 4.50537109375, 4.9586181640625, 5.411865234375, 5.8651123046875, 6.318359375, 6.7716064453125, 7.224853515625, 7.6781005859375, 8.13134765625, 8.5845947265625, 9.037841796875, 9.4910888671875, 9.9443359375, 10.3975830078125, 10.850830078125, 11.3040771484375, 11.75732421875, 12.2105712890625, 12.663818359375, 13.1170654296875, 13.5703125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 6.0, 13.0, 15.0, 18.0, 18.0, 34.0, 35.0, 34.0, 60.0, 106.0, 183.0, 296.0, 663.0, 5228.0, 2771982.0, 362797.0, 2875.0, 590.0, 282.0, 140.0, 112.0, 62.0, 42.0, 22.0, 28.0, 17.0, 13.0, 10.0, 9.0, 3.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.1875, -31.998046875, -30.80859375, -29.619140625, -28.4296875, -27.240234375, -26.05078125, -24.861328125, -23.671875, -22.482421875, -21.29296875, -20.103515625, -18.9140625, -17.724609375, -16.53515625, -15.345703125, -14.15625, -12.966796875, -11.77734375, -10.587890625, -9.3984375, -8.208984375, -7.01953125, -5.830078125, -4.640625, -3.451171875, -2.26171875, -1.072265625, 0.1171875, 1.306640625, 2.49609375, 3.685546875, 4.875, 6.064453125, 7.25390625, 8.443359375, 9.6328125, 10.822265625, 12.01171875, 13.201171875, 14.390625, 15.580078125, 16.76953125, 17.958984375, 19.1484375, 20.337890625, 21.52734375, 22.716796875, 23.90625, 25.095703125, 26.28515625, 27.474609375, 28.6640625, 29.853515625, 31.04296875, 32.232421875, 33.421875, 34.611328125, 35.80078125, 36.990234375, 38.1796875, 39.369140625, 40.55859375, 41.748046875, 42.9375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 11.0, 108.0, 326.0, 384.0, 154.0, 25.0, 6.0], "bins": [-116.4489974975586, -114.5123062133789, -112.57561492919922, -110.63893127441406, -108.70223999023438, -106.76554870605469, -104.828857421875, -102.89217376708984, -100.95548248291016, -99.01879119873047, -97.08209991455078, -95.14541625976562, -93.20872497558594, -91.27203369140625, -89.33534240722656, -87.3986587524414, -85.46196746826172, -83.52527618408203, -81.58858489990234, -79.65190124511719, -77.7152099609375, -75.77851867675781, -73.84182739257812, -71.90514373779297, -69.96845245361328, -68.0317611694336, -66.0950698852539, -64.15838623046875, -62.22169494628906, -60.285003662109375, -58.34831619262695, -56.411624908447266, -54.474937438964844, -52.538246154785156, -50.601558685302734, -48.66486740112305, -46.728179931640625, -44.79148864746094, -42.854801177978516, -40.91810989379883, -38.98141860961914, -37.04472732543945, -35.10803985595703, -33.171348571777344, -31.234661102294922, -29.297969818115234, -27.361282348632812, -25.424591064453125, -23.487903594970703, -21.55121421813965, -19.614524841308594, -17.67783546447754, -15.741146087646484, -13.804455757141113, -11.867766380310059, -9.931077003479004, -7.994387626647949, -6.0576982498168945, -4.12100887298584, -2.184319019317627, -0.24762964248657227, 1.6890602111816406, 3.6257495880126953, 5.56243896484375, 7.499128341674805]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 3.0, 10.0, 8.0, 12.0, 14.0, 13.0, 14.0, 21.0, 23.0, 18.0, 24.0, 19.0, 28.0, 34.0, 38.0, 39.0, 31.0, 27.0, 44.0, 30.0, 42.0, 47.0, 37.0, 41.0, 26.0, 36.0, 42.0, 27.0, 25.0, 27.0, 26.0, 19.0, 17.0, 18.0, 21.0, 13.0, 14.0, 13.0, 10.0, 10.0, 11.0, 7.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-38.564788818359375, -37.33913040161133, -36.113468170166016, -34.88780975341797, -33.66215133666992, -32.436492919921875, -31.210830688476562, -29.985172271728516, -28.759511947631836, -27.533851623535156, -26.30819320678711, -25.08253288269043, -23.85687255859375, -22.631214141845703, -21.405553817749023, -20.179893493652344, -18.954235076904297, -17.728574752807617, -16.50291633605957, -15.27725601196289, -14.051596641540527, -12.825937271118164, -11.600276947021484, -10.374617576599121, -9.148958206176758, -7.9232988357543945, -6.697638988494873, -5.471979141235352, -4.246319770812988, -3.020660400390625, -1.7950005531311035, -0.569340705871582, 0.6563224792480469, 1.8819820880889893, 3.1076416969299316, 4.333301544189453, 5.558960914611816, 6.78462028503418, 8.01028060913086, 9.235939979553223, 10.461599349975586, 11.68725872039795, 12.912918090820312, 14.138578414916992, 15.364237785339355, 16.58989715576172, 17.8155574798584, 19.041217803955078, 20.266876220703125, 21.492536544799805, 22.71819496154785, 23.94385528564453, 25.169513702392578, 26.395174026489258, 27.620834350585938, 28.846492767333984, 30.072153091430664, 31.297813415527344, 32.52347183227539, 33.74913024902344, 34.97479248046875, 36.2004508972168, 37.426109313964844, 38.651771545410156, 39.8774299621582]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 9.0, 5.0, 10.0, 16.0, 19.0, 15.0, 26.0, 23.0, 29.0, 31.0, 30.0, 30.0, 26.0, 44.0, 40.0, 47.0, 32.0, 31.0, 39.0, 34.0, 48.0, 45.0, 41.0, 34.0, 30.0, 32.0, 27.0, 30.0, 27.0, 16.0, 15.0, 18.0, 18.0, 9.0, 11.0, 9.0, 8.0, 5.0, 8.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.828125, -3.7001953125, -3.572265625, -3.4443359375, -3.31640625, -3.1884765625, -3.060546875, -2.9326171875, -2.8046875, -2.6767578125, -2.548828125, -2.4208984375, -2.29296875, -2.1650390625, -2.037109375, -1.9091796875, -1.78125, -1.6533203125, -1.525390625, -1.3974609375, -1.26953125, -1.1416015625, -1.013671875, -0.8857421875, -0.7578125, -0.6298828125, -0.501953125, -0.3740234375, -0.24609375, -0.1181640625, 0.009765625, 0.1376953125, 0.265625, 0.3935546875, 0.521484375, 0.6494140625, 0.77734375, 0.9052734375, 1.033203125, 1.1611328125, 1.2890625, 1.4169921875, 1.544921875, 1.6728515625, 1.80078125, 1.9287109375, 2.056640625, 2.1845703125, 2.3125, 2.4404296875, 2.568359375, 2.6962890625, 2.82421875, 2.9521484375, 3.080078125, 3.2080078125, 3.3359375, 3.4638671875, 3.591796875, 3.7197265625, 3.84765625, 3.9755859375, 4.103515625, 4.2314453125, 4.359375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 5.0, 14.0, 12.0, 22.0, 33.0, 36.0, 60.0, 94.0, 122.0, 233.0, 357.0, 623.0, 1166.0, 2037.0, 3913.0, 7713.0, 16157.0, 38373.0, 105833.0, 350384.0, 1036272.0, 1471909.0, 778856.0, 246066.0, 77810.0, 29637.0, 13104.0, 6232.0, 3157.0, 1617.0, 977.0, 513.0, 364.0, 188.0, 119.0, 82.0, 54.0, 45.0, 29.0, 21.0, 8.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4921875, -4.333740234375, -4.17529296875, -4.016845703125, -3.8583984375, -3.699951171875, -3.54150390625, -3.383056640625, -3.224609375, -3.066162109375, -2.90771484375, -2.749267578125, -2.5908203125, -2.432373046875, -2.27392578125, -2.115478515625, -1.95703125, -1.798583984375, -1.64013671875, -1.481689453125, -1.3232421875, -1.164794921875, -1.00634765625, -0.847900390625, -0.689453125, -0.531005859375, -0.37255859375, -0.214111328125, -0.0556640625, 0.102783203125, 0.26123046875, 0.419677734375, 0.578125, 0.736572265625, 0.89501953125, 1.053466796875, 1.2119140625, 1.370361328125, 1.52880859375, 1.687255859375, 1.845703125, 2.004150390625, 2.16259765625, 2.321044921875, 2.4794921875, 2.637939453125, 2.79638671875, 2.954833984375, 3.11328125, 3.271728515625, 3.43017578125, 3.588623046875, 3.7470703125, 3.905517578125, 4.06396484375, 4.222412109375, 4.380859375, 4.539306640625, 4.69775390625, 4.856201171875, 5.0146484375, 5.173095703125, 5.33154296875, 5.489990234375, 5.6484375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 6.0, 4.0, 11.0, 19.0, 7.0, 22.0, 32.0, 32.0, 49.0, 82.0, 86.0, 111.0, 180.0, 217.0, 270.0, 346.0, 433.0, 439.0, 428.0, 327.0, 231.0, 196.0, 133.0, 104.0, 102.0, 64.0, 29.0, 38.0, 19.0, 19.0, 11.0, 10.0, 7.0, 7.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-14.53125, -14.1788330078125, -13.826416015625, -13.4739990234375, -13.12158203125, -12.7691650390625, -12.416748046875, -12.0643310546875, -11.7119140625, -11.3594970703125, -11.007080078125, -10.6546630859375, -10.30224609375, -9.9498291015625, -9.597412109375, -9.2449951171875, -8.892578125, -8.5401611328125, -8.187744140625, -7.8353271484375, -7.48291015625, -7.1304931640625, -6.778076171875, -6.4256591796875, -6.0732421875, -5.7208251953125, -5.368408203125, -5.0159912109375, -4.66357421875, -4.3111572265625, -3.958740234375, -3.6063232421875, -3.25390625, -2.9014892578125, -2.549072265625, -2.1966552734375, -1.84423828125, -1.4918212890625, -1.139404296875, -0.7869873046875, -0.4345703125, -0.0821533203125, 0.270263671875, 0.6226806640625, 0.97509765625, 1.3275146484375, 1.679931640625, 2.0323486328125, 2.384765625, 2.7371826171875, 3.089599609375, 3.4420166015625, 3.79443359375, 4.1468505859375, 4.499267578125, 4.8516845703125, 5.2041015625, 5.5565185546875, 5.908935546875, 6.2613525390625, 6.61376953125, 6.9661865234375, 7.318603515625, 7.6710205078125, 8.0234375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 15.0, 8.0, 15.0, 30.0, 36.0, 56.0, 53.0, 92.0, 132.0, 179.0, 394.0, 1002.0, 7275.0, 362465.0, 3756325.0, 61857.0, 2802.0, 673.0, 287.0, 157.0, 95.0, 88.0, 50.0, 42.0, 31.0, 26.0, 16.0, 18.0, 15.0, 10.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.5, -29.294921875, -28.08984375, -26.884765625, -25.6796875, -24.474609375, -23.26953125, -22.064453125, -20.859375, -19.654296875, -18.44921875, -17.244140625, -16.0390625, -14.833984375, -13.62890625, -12.423828125, -11.21875, -10.013671875, -8.80859375, -7.603515625, -6.3984375, -5.193359375, -3.98828125, -2.783203125, -1.578125, -0.373046875, 0.83203125, 2.037109375, 3.2421875, 4.447265625, 5.65234375, 6.857421875, 8.0625, 9.267578125, 10.47265625, 11.677734375, 12.8828125, 14.087890625, 15.29296875, 16.498046875, 17.703125, 18.908203125, 20.11328125, 21.318359375, 22.5234375, 23.728515625, 24.93359375, 26.138671875, 27.34375, 28.548828125, 29.75390625, 30.958984375, 32.1640625, 33.369140625, 34.57421875, 35.779296875, 36.984375, 38.189453125, 39.39453125, 40.599609375, 41.8046875, 43.009765625, 44.21484375, 45.419921875, 46.625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 14.0, 43.0, 101.0, 140.0, 186.0, 222.0, 157.0, 86.0, 32.0, 18.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.33330535888672, -121.43858337402344, -118.54386901855469, -115.6491470336914, -112.75443267822266, -109.85971069335938, -106.96499633789062, -104.07027435302734, -101.17555236816406, -98.28083038330078, -95.38611602783203, -92.49139404296875, -89.5966796875, -86.70195770263672, -83.80723571777344, -80.91252136230469, -78.01780700683594, -75.12308502197266, -72.2283706665039, -69.33364868164062, -66.43893432617188, -63.544212341308594, -60.64949417114258, -57.75477600097656, -54.86005783081055, -51.96533966064453, -49.070621490478516, -46.1759033203125, -43.28118133544922, -40.38646697998047, -37.49174499511719, -34.59702682495117, -31.702301025390625, -28.80758285522461, -25.912864685058594, -23.018144607543945, -20.12342643737793, -17.228708267211914, -14.333988189697266, -11.43927001953125, -8.544551849365234, -5.6498332023620605, -2.7551145553588867, 0.1396045684814453, 3.034322738647461, 5.929040908813477, 8.823760986328125, 11.71847915649414, 14.613197326660156, 17.507915496826172, 20.402633666992188, 23.297353744506836, 26.19207191467285, 29.086790084838867, 31.981510162353516, 34.87622833251953, 37.77094650268555, 40.66566467285156, 43.56038284301758, 46.455101013183594, 49.349822998046875, 52.244537353515625, 55.139259338378906, 58.03397750854492, 60.92869567871094]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 3.0, 7.0, 9.0, 21.0, 13.0, 25.0, 21.0, 19.0, 28.0, 27.0, 27.0, 34.0, 28.0, 52.0, 51.0, 43.0, 34.0, 45.0, 36.0, 39.0, 52.0, 43.0, 29.0, 31.0, 23.0, 28.0, 27.0, 23.0, 23.0, 21.0, 20.0, 19.0, 13.0, 12.0, 10.0, 9.0, 14.0, 9.0, 2.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-40.26957702636719, -39.09467315673828, -37.91977310180664, -36.744869232177734, -35.56996536254883, -34.39506530761719, -33.22016143798828, -32.045257568359375, -30.870357513427734, -29.69545555114746, -28.520551681518555, -27.34564971923828, -26.170747756958008, -24.995845794677734, -23.820941925048828, -22.646039962768555, -21.47113609313965, -20.296234130859375, -19.12133026123047, -17.946428298950195, -16.771526336669922, -15.596623420715332, -14.421720504760742, -13.246818542480469, -12.071915626525879, -10.897012710571289, -9.722110748291016, -8.547207832336426, -7.372305393218994, -6.1974029541015625, -5.022500038146973, -3.847598075866699, -2.6726951599121094, -1.4977926015853882, -0.322890043258667, 0.8520126342773438, 2.0269150733947754, 3.201817512512207, 4.376720428466797, 5.55162239074707, 6.72652530670166, 7.901427745819092, 9.076330184936523, 10.251233100891113, 11.426136016845703, 12.601037979125977, 13.775940895080566, 14.95084285736084, 16.12574577331543, 17.300647735595703, 18.47555160522461, 19.650453567504883, 20.825355529785156, 22.000259399414062, 23.175161361694336, 24.35006332397461, 25.524967193603516, 26.69986915588379, 27.874773025512695, 29.04967498779297, 30.224576950073242, 31.399478912353516, 32.57438278198242, 33.74928283691406, 34.92418670654297]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 6.0, 6.0, 8.0, 10.0, 13.0, 13.0, 23.0, 21.0, 16.0, 32.0, 31.0, 39.0, 37.0, 32.0, 41.0, 41.0, 36.0, 41.0, 36.0, 40.0, 53.0, 48.0, 46.0, 35.0, 39.0, 26.0, 29.0, 28.0, 25.0, 27.0, 23.0, 12.0, 18.0, 13.0, 13.0, 9.0, 7.0, 3.0, 1.0, 5.0, 4.0, 8.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.6328125, -4.49237060546875, -4.3519287109375, -4.21148681640625, -4.071044921875, -3.93060302734375, -3.7901611328125, -3.64971923828125, -3.50927734375, -3.36883544921875, -3.2283935546875, -3.08795166015625, -2.947509765625, -2.80706787109375, -2.6666259765625, -2.52618408203125, -2.3857421875, -2.24530029296875, -2.1048583984375, -1.96441650390625, -1.823974609375, -1.68353271484375, -1.5430908203125, -1.40264892578125, -1.26220703125, -1.12176513671875, -0.9813232421875, -0.84088134765625, -0.700439453125, -0.55999755859375, -0.4195556640625, -0.27911376953125, -0.138671875, 0.00177001953125, 0.1422119140625, 0.28265380859375, 0.423095703125, 0.56353759765625, 0.7039794921875, 0.84442138671875, 0.98486328125, 1.12530517578125, 1.2657470703125, 1.40618896484375, 1.546630859375, 1.68707275390625, 1.8275146484375, 1.96795654296875, 2.1083984375, 2.24884033203125, 2.3892822265625, 2.52972412109375, 2.670166015625, 2.81060791015625, 2.9510498046875, 3.09149169921875, 3.23193359375, 3.37237548828125, 3.5128173828125, 3.65325927734375, 3.793701171875, 3.93414306640625, 4.0745849609375, 4.21502685546875, 4.35546875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 9.0, 19.0, 18.0, 26.0, 55.0, 57.0, 90.0, 145.0, 196.0, 284.0, 420.0, 642.0, 963.0, 1486.0, 2241.0, 3466.0, 5306.0, 8558.0, 13740.0, 22919.0, 39726.0, 73817.0, 147739.0, 262486.0, 217486.0, 109624.0, 56075.0, 31518.0, 18610.0, 10879.0, 7126.0, 4385.0, 2860.0, 1918.0, 1204.0, 795.0, 536.0, 344.0, 246.0, 174.0, 126.0, 62.0, 62.0, 35.0, 25.0, 19.0, 9.0, 9.0, 5.0, 5.0, 5.0, 3.0, 0.0, 3.0], "bins": [-0.77490234375, -0.7519683837890625, -0.729034423828125, -0.7061004638671875, -0.68316650390625, -0.6602325439453125, -0.637298583984375, -0.6143646240234375, -0.5914306640625, -0.5684967041015625, -0.545562744140625, -0.5226287841796875, -0.49969482421875, -0.4767608642578125, -0.453826904296875, -0.4308929443359375, -0.407958984375, -0.3850250244140625, -0.362091064453125, -0.3391571044921875, -0.31622314453125, -0.2932891845703125, -0.270355224609375, -0.2474212646484375, -0.2244873046875, -0.2015533447265625, -0.178619384765625, -0.1556854248046875, -0.13275146484375, -0.1098175048828125, -0.086883544921875, -0.0639495849609375, -0.041015625, -0.0180816650390625, 0.004852294921875, 0.0277862548828125, 0.05072021484375, 0.0736541748046875, 0.096588134765625, 0.1195220947265625, 0.1424560546875, 0.1653900146484375, 0.188323974609375, 0.2112579345703125, 0.23419189453125, 0.2571258544921875, 0.280059814453125, 0.3029937744140625, 0.325927734375, 0.3488616943359375, 0.371795654296875, 0.3947296142578125, 0.41766357421875, 0.4405975341796875, 0.463531494140625, 0.4864654541015625, 0.5093994140625, 0.5323333740234375, 0.555267333984375, 0.5782012939453125, 0.60113525390625, 0.6240692138671875, 0.647003173828125, 0.6699371337890625, 0.69287109375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 11.0, 11.0, 7.0, 10.0, 13.0, 16.0, 15.0, 18.0, 22.0, 30.0, 35.0, 29.0, 36.0, 34.0, 36.0, 49.0, 41.0, 45.0, 1080.0, 40.0, 38.0, 47.0, 27.0, 30.0, 46.0, 33.0, 25.0, 37.0, 34.0, 17.0, 15.0, 21.0, 8.0, 19.0, 10.0, 8.0, 7.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.982421875, -2.89306640625, -2.8037109375, -2.71435546875, -2.625, -2.53564453125, -2.4462890625, -2.35693359375, -2.267578125, -2.17822265625, -2.0888671875, -1.99951171875, -1.91015625, -1.82080078125, -1.7314453125, -1.64208984375, -1.552734375, -1.46337890625, -1.3740234375, -1.28466796875, -1.1953125, -1.10595703125, -1.0166015625, -0.92724609375, -0.837890625, -0.74853515625, -0.6591796875, -0.56982421875, -0.48046875, -0.39111328125, -0.3017578125, -0.21240234375, -0.123046875, -0.03369140625, 0.0556640625, 0.14501953125, 0.234375, 0.32373046875, 0.4130859375, 0.50244140625, 0.591796875, 0.68115234375, 0.7705078125, 0.85986328125, 0.94921875, 1.03857421875, 1.1279296875, 1.21728515625, 1.306640625, 1.39599609375, 1.4853515625, 1.57470703125, 1.6640625, 1.75341796875, 1.8427734375, 1.93212890625, 2.021484375, 2.11083984375, 2.2001953125, 2.28955078125, 2.37890625, 2.46826171875, 2.5576171875, 2.64697265625, 2.736328125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 6.0, 5.0, 8.0, 13.0, 19.0, 52.0, 65.0, 92.0, 154.0, 238.0, 422.0, 658.0, 1061.0, 1618.0, 2671.0, 4369.0, 7124.0, 11835.0, 20940.0, 36303.0, 65758.0, 124433.0, 218374.0, 1279643.0, 144616.0, 76684.0, 41656.0, 23772.0, 13642.0, 8091.0, 4941.0, 2977.0, 1839.0, 1120.0, 732.0, 443.0, 272.0, 172.0, 117.0, 70.0, 60.0, 19.0, 20.0, 10.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5224609375, -0.506195068359375, -0.48992919921875, -0.473663330078125, -0.4573974609375, -0.441131591796875, -0.42486572265625, -0.408599853515625, -0.392333984375, -0.376068115234375, -0.35980224609375, -0.343536376953125, -0.3272705078125, -0.311004638671875, -0.29473876953125, -0.278472900390625, -0.26220703125, -0.245941162109375, -0.22967529296875, -0.213409423828125, -0.1971435546875, -0.180877685546875, -0.16461181640625, -0.148345947265625, -0.132080078125, -0.115814208984375, -0.09954833984375, -0.083282470703125, -0.0670166015625, -0.050750732421875, -0.03448486328125, -0.018218994140625, -0.001953125, 0.014312744140625, 0.03057861328125, 0.046844482421875, 0.0631103515625, 0.079376220703125, 0.09564208984375, 0.111907958984375, 0.128173828125, 0.144439697265625, 0.16070556640625, 0.176971435546875, 0.1932373046875, 0.209503173828125, 0.22576904296875, 0.242034912109375, 0.25830078125, 0.274566650390625, 0.29083251953125, 0.307098388671875, 0.3233642578125, 0.339630126953125, 0.35589599609375, 0.372161865234375, 0.388427734375, 0.404693603515625, 0.42095947265625, 0.437225341796875, 0.4534912109375, 0.469757080078125, 0.48602294921875, 0.502288818359375, 0.5185546875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 8.0, 2.0, 7.0, 10.0, 15.0, 15.0, 23.0, 27.0, 38.0, 46.0, 50.0, 77.0, 76.0, 73.0, 71.0, 82.0, 65.0, 71.0, 52.0, 32.0, 38.0, 24.0, 30.0, 15.0, 14.0, 10.0, 2.0, 8.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00278472900390625, -0.002713307738304138, -0.0026418864727020264, -0.0025704652070999146, -0.0024990439414978027, -0.002427622675895691, -0.002356201410293579, -0.0022847801446914673, -0.0022133588790893555, -0.0021419376134872437, -0.002070516347885132, -0.00199909508228302, -0.0019276738166809082, -0.0018562525510787964, -0.0017848312854766846, -0.0017134100198745728, -0.001641988754272461, -0.0015705674886703491, -0.0014991462230682373, -0.0014277249574661255, -0.0013563036918640137, -0.0012848824262619019, -0.00121346116065979, -0.0011420398950576782, -0.0010706186294555664, -0.0009991973638534546, -0.0009277760982513428, -0.000856354832649231, -0.0007849335670471191, -0.0007135123014450073, -0.0006420910358428955, -0.0005706697702407837, -0.0004992485046386719, -0.00042782723903656006, -0.00035640597343444824, -0.0002849847078323364, -0.0002135634422302246, -0.0001421421766281128, -7.072091102600098e-05, 7.003545761108398e-07, 7.212162017822266e-05, 0.00014354288578033447, 0.0002149641513824463, 0.0002863854169845581, 0.0003578066825866699, 0.00042922794818878174, 0.0005006492137908936, 0.0005720704793930054, 0.0006434917449951172, 0.000714913010597229, 0.0007863342761993408, 0.0008577555418014526, 0.0009291768074035645, 0.0010005980730056763, 0.001072019338607788, 0.0011434406042099, 0.0012148618698120117, 0.0012862831354141235, 0.0013577044010162354, 0.0014291256666183472, 0.001500546932220459, 0.0015719681978225708, 0.0016433894634246826, 0.0017148107290267944, 0.0017862319946289062]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 8.0, 6.0, 1.0, 16.0, 16.0, 27.0, 39.0, 56.0, 65.0, 135.0, 298.0, 935.0, 413221.0, 632027.0, 1023.0, 316.0, 133.0, 79.0, 46.0, 28.0, 22.0, 18.0, 8.0, 6.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055633544921875, -0.05341005325317383, -0.051186561584472656, -0.048963069915771484, -0.04673957824707031, -0.04451608657836914, -0.04229259490966797, -0.0400691032409668, -0.037845611572265625, -0.03562211990356445, -0.03339862823486328, -0.03117513656616211, -0.028951644897460938, -0.026728153228759766, -0.024504661560058594, -0.022281169891357422, -0.02005767822265625, -0.017834186553955078, -0.015610694885253906, -0.013387203216552734, -0.011163711547851562, -0.00894021987915039, -0.006716728210449219, -0.004493236541748047, -0.002269744873046875, -4.6253204345703125e-05, 0.0021772384643554688, 0.004400730133056641, 0.0066242218017578125, 0.008847713470458984, 0.011071205139160156, 0.013294696807861328, 0.0155181884765625, 0.017741680145263672, 0.019965171813964844, 0.022188663482666016, 0.024412155151367188, 0.02663564682006836, 0.02885913848876953, 0.031082630157470703, 0.033306121826171875, 0.03552961349487305, 0.03775310516357422, 0.03997659683227539, 0.04220008850097656, 0.044423580169677734, 0.046647071838378906, 0.04887056350708008, 0.05109405517578125, 0.05331754684448242, 0.055541038513183594, 0.057764530181884766, 0.05998802185058594, 0.06221151351928711, 0.06443500518798828, 0.06665849685668945, 0.06888198852539062, 0.0711054801940918, 0.07332897186279297, 0.07555246353149414, 0.07777595520019531, 0.07999944686889648, 0.08222293853759766, 0.08444643020629883, 0.086669921875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 12.0, 1007.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009045690298080444, -0.007335582748055458, -0.005625475198030472, -0.0039153676480054855, -0.0022052600979804993, -0.000495152547955513, 0.0012149550020694733, 0.0029250625520944595, 0.004635170102119446, 0.006345277652144432, 0.008055385202169418, 0.009765492752194405, 0.011475600302219391, 0.013185707852244377, 0.014895815402269363, 0.01660592295229435, 0.018316030502319336, 0.020026138052344322, 0.02173624560236931, 0.023446353152394295, 0.02515646070241928, 0.026866568252444267, 0.028576675802469254, 0.03028678335249424, 0.031996890902519226, 0.03370700031518936, 0.0354171060025692, 0.037127211689949036, 0.03883732110261917, 0.04054743051528931, 0.042257536202669144, 0.04396764189004898, 0.045677751302719116, 0.04738786071538925, 0.04909796640276909, 0.050808072090148926, 0.05251818150281906, 0.0542282909154892, 0.055938396602869034, 0.05764850229024887, 0.059358611702919006, 0.06106872111558914, 0.06277883052825928, 0.06448893249034882, 0.06619904190301895, 0.06790915131568909, 0.06961925327777863, 0.07132936269044876, 0.0730394721031189, 0.07474958151578903, 0.07645969092845917, 0.0781697928905487, 0.07987990230321884, 0.08159001171588898, 0.08330011367797852, 0.08501022309064865, 0.08672033250331879, 0.08843044191598892, 0.09014055132865906, 0.0918506532907486, 0.09356076270341873, 0.09527087211608887, 0.0969809740781784, 0.09869108349084854, 0.10040119290351868]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 8.0, 4.0, 9.0, 14.0, 21.0, 39.0, 34.0, 55.0, 72.0, 63.0, 80.0, 76.0, 71.0, 87.0, 80.0, 68.0, 58.0, 43.0, 45.0, 19.0, 19.0, 23.0, 8.0, 8.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0025292038917541504, -0.0024705110117793083, -0.0024118181318044662, -0.002353125251829624, -0.002294432371854782, -0.00223573949187994, -0.002177046611905098, -0.002118353731930256, -0.002059660851955414, -0.0020009679719805717, -0.0019422750920057297, -0.0018835822120308876, -0.0018248893320560455, -0.0017661964520812035, -0.0017075035721063614, -0.0016488106921315193, -0.0015901178121566772, -0.0015314249321818352, -0.001472732052206993, -0.001414039172232151, -0.001355346292257309, -0.0012966534122824669, -0.0012379605323076248, -0.0011792676523327827, -0.0011205747723579407, -0.0010618818923830986, -0.0010031890124082565, -0.0009444961324334145, -0.0008858032524585724, -0.0008271103724837303, -0.0007684174925088882, -0.0007097246125340462, -0.0006510317325592041, -0.000592338852584362, -0.00053364597260952, -0.0004749530926346779, -0.0004162602126598358, -0.00035756733268499374, -0.00029887445271015167, -0.0002401815727353096, -0.00018148869276046753, -0.00012279581278562546, -6.410293281078339e-05, -5.410052835941315e-06, 5.328282713890076e-05, 0.00011197570711374283, 0.0001706685870885849, 0.00022936146706342697, 0.00028805434703826904, 0.0003467472270131111, 0.0004054401069879532, 0.00046413298696279526, 0.0005228258669376373, 0.0005815187469124794, 0.0006402116268873215, 0.0006989045068621635, 0.0007575973868370056, 0.0008162902668118477, 0.0008749831467866898, 0.0009336760267615318, 0.000992368906736374, 0.001051061786711216, 0.001109754666686058, 0.0011684475466609001, 0.0012271404266357422]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 6.0, 6.0, 8.0, 10.0, 13.0, 13.0, 23.0, 21.0, 16.0, 32.0, 31.0, 39.0, 37.0, 32.0, 41.0, 41.0, 36.0, 41.0, 36.0, 40.0, 53.0, 48.0, 46.0, 35.0, 39.0, 26.0, 29.0, 28.0, 25.0, 27.0, 23.0, 12.0, 18.0, 13.0, 13.0, 9.0, 7.0, 3.0, 1.0, 5.0, 4.0, 8.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.6328125, -4.49237060546875, -4.3519287109375, -4.21148681640625, -4.071044921875, -3.93060302734375, -3.7901611328125, -3.64971923828125, -3.50927734375, -3.36883544921875, -3.2283935546875, -3.08795166015625, -2.947509765625, -2.80706787109375, -2.6666259765625, -2.52618408203125, -2.3857421875, -2.24530029296875, -2.1048583984375, -1.96441650390625, -1.823974609375, -1.68353271484375, -1.5430908203125, -1.40264892578125, -1.26220703125, -1.12176513671875, -0.9813232421875, -0.84088134765625, -0.700439453125, -0.55999755859375, -0.4195556640625, -0.27911376953125, -0.138671875, 0.00177001953125, 0.1422119140625, 0.28265380859375, 0.423095703125, 0.56353759765625, 0.7039794921875, 0.84442138671875, 0.98486328125, 1.12530517578125, 1.2657470703125, 1.40618896484375, 1.546630859375, 1.68707275390625, 1.8275146484375, 1.96795654296875, 2.1083984375, 2.24884033203125, 2.3892822265625, 2.52972412109375, 2.670166015625, 2.81060791015625, 2.9510498046875, 3.09149169921875, 3.23193359375, 3.37237548828125, 3.5128173828125, 3.65325927734375, 3.793701171875, 3.93414306640625, 4.0745849609375, 4.21502685546875, 4.35546875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 8.0, 6.0, 17.0, 22.0, 34.0, 39.0, 77.0, 92.0, 137.0, 245.0, 358.0, 546.0, 913.0, 1488.0, 2511.0, 4113.0, 7532.0, 15574.0, 37017.0, 110044.0, 404714.0, 317147.0, 86416.0, 30234.0, 13097.0, 6696.0, 3677.0, 2143.0, 1346.0, 807.0, 522.0, 310.0, 210.0, 172.0, 92.0, 79.0, 30.0, 18.0, 22.0, 7.0, 12.0, 10.0, 10.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.884765625, -3.762969970703125, -3.64117431640625, -3.519378662109375, -3.3975830078125, -3.275787353515625, -3.15399169921875, -3.032196044921875, -2.910400390625, -2.788604736328125, -2.66680908203125, -2.545013427734375, -2.4232177734375, -2.301422119140625, -2.17962646484375, -2.057830810546875, -1.93603515625, -1.814239501953125, -1.69244384765625, -1.570648193359375, -1.4488525390625, -1.327056884765625, -1.20526123046875, -1.083465576171875, -0.961669921875, -0.839874267578125, -0.71807861328125, -0.596282958984375, -0.4744873046875, -0.352691650390625, -0.23089599609375, -0.109100341796875, 0.0126953125, 0.134490966796875, 0.25628662109375, 0.378082275390625, 0.4998779296875, 0.621673583984375, 0.74346923828125, 0.865264892578125, 0.987060546875, 1.108856201171875, 1.23065185546875, 1.352447509765625, 1.4742431640625, 1.596038818359375, 1.71783447265625, 1.839630126953125, 1.96142578125, 2.083221435546875, 2.20501708984375, 2.326812744140625, 2.4486083984375, 2.570404052734375, 2.69219970703125, 2.813995361328125, 2.935791015625, 3.057586669921875, 3.17938232421875, 3.301177978515625, 3.4229736328125, 3.544769287109375, 3.66656494140625, 3.788360595703125, 3.91015625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 7.0, 9.0, 13.0, 15.0, 11.0, 22.0, 23.0, 23.0, 31.0, 40.0, 34.0, 33.0, 47.0, 43.0, 66.0, 83.0, 275.0, 1651.0, 167.0, 60.0, 68.0, 41.0, 37.0, 28.0, 28.0, 32.0, 27.0, 22.0, 23.0, 16.0, 15.0, 12.0, 12.0, 3.0, 0.0, 7.0, 5.0, 6.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.40625, -17.88525390625, -17.3642578125, -16.84326171875, -16.322265625, -15.80126953125, -15.2802734375, -14.75927734375, -14.23828125, -13.71728515625, -13.1962890625, -12.67529296875, -12.154296875, -11.63330078125, -11.1123046875, -10.59130859375, -10.0703125, -9.54931640625, -9.0283203125, -8.50732421875, -7.986328125, -7.46533203125, -6.9443359375, -6.42333984375, -5.90234375, -5.38134765625, -4.8603515625, -4.33935546875, -3.818359375, -3.29736328125, -2.7763671875, -2.25537109375, -1.734375, -1.21337890625, -0.6923828125, -0.17138671875, 0.349609375, 0.87060546875, 1.3916015625, 1.91259765625, 2.43359375, 2.95458984375, 3.4755859375, 3.99658203125, 4.517578125, 5.03857421875, 5.5595703125, 6.08056640625, 6.6015625, 7.12255859375, 7.6435546875, 8.16455078125, 8.685546875, 9.20654296875, 9.7275390625, 10.24853515625, 10.76953125, 11.29052734375, 11.8115234375, 12.33251953125, 12.853515625, 13.37451171875, 13.8955078125, 14.41650390625, 14.9375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 4.0, 12.0, 14.0, 15.0, 25.0, 30.0, 25.0, 30.0, 64.0, 49.0, 103.0, 123.0, 175.0, 291.0, 501.0, 2820.0, 341875.0, 2792083.0, 5631.0, 688.0, 333.0, 185.0, 149.0, 115.0, 81.0, 52.0, 46.0, 33.0, 32.0, 18.0, 21.0, 21.0, 9.0, 11.0, 9.0, 4.0, 4.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.5, -28.45068359375, -27.4013671875, -26.35205078125, -25.302734375, -24.25341796875, -23.2041015625, -22.15478515625, -21.10546875, -20.05615234375, -19.0068359375, -17.95751953125, -16.908203125, -15.85888671875, -14.8095703125, -13.76025390625, -12.7109375, -11.66162109375, -10.6123046875, -9.56298828125, -8.513671875, -7.46435546875, -6.4150390625, -5.36572265625, -4.31640625, -3.26708984375, -2.2177734375, -1.16845703125, -0.119140625, 0.93017578125, 1.9794921875, 3.02880859375, 4.078125, 5.12744140625, 6.1767578125, 7.22607421875, 8.275390625, 9.32470703125, 10.3740234375, 11.42333984375, 12.47265625, 13.52197265625, 14.5712890625, 15.62060546875, 16.669921875, 17.71923828125, 18.7685546875, 19.81787109375, 20.8671875, 21.91650390625, 22.9658203125, 24.01513671875, 25.064453125, 26.11376953125, 27.1630859375, 28.21240234375, 29.26171875, 30.31103515625, 31.3603515625, 32.40966796875, 33.458984375, 34.50830078125, 35.5576171875, 36.60693359375, 37.65625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 13.0, 26.0, 100.0, 220.0, 286.0, 234.0, 99.0, 20.0, 7.0, 3.0, 2.0, 1.0], "bins": [-62.753448486328125, -61.642967224121094, -60.5324821472168, -59.422000885009766, -58.31151580810547, -57.20103454589844, -56.090553283691406, -54.98006820678711, -53.86958694458008, -52.75910568237305, -51.64862060546875, -50.53813934326172, -49.42765808105469, -48.31717300415039, -47.20669174194336, -46.09620666503906, -44.98572540283203, -43.875244140625, -42.7647590637207, -41.65427780151367, -40.543792724609375, -39.433311462402344, -38.32283020019531, -37.212345123291016, -36.101863861083984, -34.99138259887695, -33.880897521972656, -32.770416259765625, -31.65993309020996, -30.549449920654297, -29.438968658447266, -28.3284854888916, -27.218006134033203, -26.10752296447754, -24.997039794921875, -23.886558532714844, -22.77607536315918, -21.665592193603516, -20.555110931396484, -19.44462776184082, -18.334144592285156, -17.223661422729492, -16.113178253173828, -15.002696990966797, -13.892213821411133, -12.781730651855469, -11.671248435974121, -10.560766220092773, -9.450282096862793, -8.339799880981445, -7.229316711425781, -6.118834018707275, -5.0083513259887695, -3.8978686332702637, -2.787385940551758, -1.676903247833252, -0.5664205551147461, 0.5440621376037598, 1.6545448303222656, 2.7650275230407715, 3.8755102157592773, 4.985992908477783, 6.096475601196289, 7.206958293914795, 8.3174409866333]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 2.0, 9.0, 14.0, 5.0, 14.0, 20.0, 20.0, 24.0, 18.0, 26.0, 25.0, 29.0, 42.0, 50.0, 53.0, 60.0, 47.0, 46.0, 48.0, 55.0, 48.0, 50.0, 40.0, 33.0, 40.0, 37.0, 24.0, 23.0, 19.0, 21.0, 20.0, 10.0, 7.0, 10.0, 3.0, 2.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.25403594970703, -49.77967834472656, -48.305320739746094, -46.830963134765625, -45.356605529785156, -43.88224792480469, -42.40789031982422, -40.93353271484375, -39.45917510986328, -37.98481750488281, -36.510459899902344, -35.036102294921875, -33.561744689941406, -32.08738708496094, -30.6130313873291, -29.138673782348633, -27.664318084716797, -26.189960479736328, -24.71560287475586, -23.24124526977539, -21.766887664794922, -20.292530059814453, -18.818174362182617, -17.34381675720215, -15.86945915222168, -14.395101547241211, -12.920743942260742, -11.44638729095459, -9.972029685974121, -8.497672080993652, -7.0233154296875, -5.548957824707031, -4.074604034423828, -2.6002466678619385, -1.1258893013000488, 0.3484678268432617, 1.8228254318237305, 3.297183036804199, 4.771539688110352, 6.24589729309082, 7.720254898071289, 9.194612503051758, 10.668970108032227, 12.143326759338379, 13.617684364318848, 15.092041969299316, 16.56639862060547, 18.040756225585938, 19.515113830566406, 20.989471435546875, 22.463829040527344, 23.938186645507812, 25.41254425048828, 26.88690185546875, 28.361257553100586, 29.835615158081055, 31.309972763061523, 32.78432846069336, 34.25868606567383, 35.7330436706543, 37.207401275634766, 38.681758880615234, 40.1561164855957, 41.63047409057617, 43.10483169555664]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 5.0, 5.0, 7.0, 8.0, 11.0, 12.0, 19.0, 13.0, 18.0, 21.0, 30.0, 40.0, 29.0, 44.0, 35.0, 27.0, 38.0, 28.0, 44.0, 46.0, 40.0, 37.0, 49.0, 48.0, 43.0, 30.0, 25.0, 36.0, 28.0, 24.0, 20.0, 22.0, 24.0, 13.0, 14.0, 15.0, 13.0, 12.0, 4.0, 2.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.6484375, -4.50909423828125, -4.3697509765625, -4.23040771484375, -4.091064453125, -3.95172119140625, -3.8123779296875, -3.67303466796875, -3.53369140625, -3.39434814453125, -3.2550048828125, -3.11566162109375, -2.976318359375, -2.83697509765625, -2.6976318359375, -2.55828857421875, -2.4189453125, -2.27960205078125, -2.1402587890625, -2.00091552734375, -1.861572265625, -1.72222900390625, -1.5828857421875, -1.44354248046875, -1.30419921875, -1.16485595703125, -1.0255126953125, -0.88616943359375, -0.746826171875, -0.60748291015625, -0.4681396484375, -0.32879638671875, -0.189453125, -0.05010986328125, 0.0892333984375, 0.22857666015625, 0.367919921875, 0.50726318359375, 0.6466064453125, 0.78594970703125, 0.92529296875, 1.06463623046875, 1.2039794921875, 1.34332275390625, 1.482666015625, 1.62200927734375, 1.7613525390625, 1.90069580078125, 2.0400390625, 2.17938232421875, 2.3187255859375, 2.45806884765625, 2.597412109375, 2.73675537109375, 2.8760986328125, 3.01544189453125, 3.15478515625, 3.29412841796875, 3.4334716796875, 3.57281494140625, 3.712158203125, 3.85150146484375, 3.9908447265625, 4.13018798828125, 4.26953125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 4.0, 7.0, 14.0, 14.0, 16.0, 21.0, 21.0, 27.0, 31.0, 52.0, 54.0, 75.0, 84.0, 116.0, 278.0, 1116.0, 12152.0, 774895.0, 3346999.0, 54178.0, 2957.0, 511.0, 177.0, 97.0, 69.0, 56.0, 39.0, 36.0, 38.0, 27.0, 23.0, 18.0, 11.0, 15.0, 11.0, 6.0, 8.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-25.875, -25.118896484375, -24.36279296875, -23.606689453125, -22.8505859375, -22.094482421875, -21.33837890625, -20.582275390625, -19.826171875, -19.070068359375, -18.31396484375, -17.557861328125, -16.8017578125, -16.045654296875, -15.28955078125, -14.533447265625, -13.77734375, -13.021240234375, -12.26513671875, -11.509033203125, -10.7529296875, -9.996826171875, -9.24072265625, -8.484619140625, -7.728515625, -6.972412109375, -6.21630859375, -5.460205078125, -4.7041015625, -3.947998046875, -3.19189453125, -2.435791015625, -1.6796875, -0.923583984375, -0.16748046875, 0.588623046875, 1.3447265625, 2.100830078125, 2.85693359375, 3.613037109375, 4.369140625, 5.125244140625, 5.88134765625, 6.637451171875, 7.3935546875, 8.149658203125, 8.90576171875, 9.661865234375, 10.41796875, 11.174072265625, 11.93017578125, 12.686279296875, 13.4423828125, 14.198486328125, 14.95458984375, 15.710693359375, 16.466796875, 17.222900390625, 17.97900390625, 18.735107421875, 19.4912109375, 20.247314453125, 21.00341796875, 21.759521484375, 22.515625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 5.0, 15.0, 19.0, 7.0, 24.0, 33.0, 43.0, 40.0, 57.0, 76.0, 121.0, 140.0, 156.0, 217.0, 297.0, 347.0, 423.0, 375.0, 365.0, 303.0, 204.0, 193.0, 141.0, 99.0, 80.0, 73.0, 49.0, 39.0, 29.0, 24.0, 17.0, 17.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.9442138671875, -8.646240234375, -8.3482666015625, -8.05029296875, -7.7523193359375, -7.454345703125, -7.1563720703125, -6.8583984375, -6.5604248046875, -6.262451171875, -5.9644775390625, -5.66650390625, -5.3685302734375, -5.070556640625, -4.7725830078125, -4.474609375, -4.1766357421875, -3.878662109375, -3.5806884765625, -3.28271484375, -2.9847412109375, -2.686767578125, -2.3887939453125, -2.0908203125, -1.7928466796875, -1.494873046875, -1.1968994140625, -0.89892578125, -0.6009521484375, -0.302978515625, -0.0050048828125, 0.29296875, 0.5909423828125, 0.888916015625, 1.1868896484375, 1.48486328125, 1.7828369140625, 2.080810546875, 2.3787841796875, 2.6767578125, 2.9747314453125, 3.272705078125, 3.5706787109375, 3.86865234375, 4.1666259765625, 4.464599609375, 4.7625732421875, 5.060546875, 5.3585205078125, 5.656494140625, 5.9544677734375, 6.25244140625, 6.5504150390625, 6.848388671875, 7.1463623046875, 7.4443359375, 7.7423095703125, 8.040283203125, 8.3382568359375, 8.63623046875, 8.9342041015625, 9.232177734375, 9.5301513671875, 9.828125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 10.0, 9.0, 4.0, 13.0, 15.0, 29.0, 25.0, 48.0, 52.0, 64.0, 71.0, 95.0, 116.0, 143.0, 194.0, 283.0, 493.0, 1464.0, 13647.0, 749132.0, 3371453.0, 52091.0, 2865.0, 674.0, 340.0, 239.0, 157.0, 111.0, 101.0, 76.0, 59.0, 52.0, 45.0, 14.0, 24.0, 20.0, 13.0, 18.0, 7.0, 6.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.90625, -27.84326171875, -26.7802734375, -25.71728515625, -24.654296875, -23.59130859375, -22.5283203125, -21.46533203125, -20.40234375, -19.33935546875, -18.2763671875, -17.21337890625, -16.150390625, -15.08740234375, -14.0244140625, -12.96142578125, -11.8984375, -10.83544921875, -9.7724609375, -8.70947265625, -7.646484375, -6.58349609375, -5.5205078125, -4.45751953125, -3.39453125, -2.33154296875, -1.2685546875, -0.20556640625, 0.857421875, 1.92041015625, 2.9833984375, 4.04638671875, 5.109375, 6.17236328125, 7.2353515625, 8.29833984375, 9.361328125, 10.42431640625, 11.4873046875, 12.55029296875, 13.61328125, 14.67626953125, 15.7392578125, 16.80224609375, 17.865234375, 18.92822265625, 19.9912109375, 21.05419921875, 22.1171875, 23.18017578125, 24.2431640625, 25.30615234375, 26.369140625, 27.43212890625, 28.4951171875, 29.55810546875, 30.62109375, 31.68408203125, 32.7470703125, 33.81005859375, 34.873046875, 35.93603515625, 36.9990234375, 38.06201171875, 39.125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 6.0, 13.0, 40.0, 76.0, 140.0, 218.0, 217.0, 154.0, 83.0, 44.0, 12.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.778566360473633, -25.900775909423828, -23.022987365722656, -20.145198822021484, -17.26740837097168, -14.389618873596191, -11.511829376220703, -8.634038925170898, -5.756250381469727, -2.8784608840942383, -0.00067138671875, 2.8771181106567383, 5.754907608032227, 8.632697105407715, 11.510486602783203, 14.388277053833008, 17.26606559753418, 20.143856048583984, 23.021644592285156, 25.899433135986328, 28.777223587036133, 31.655014038085938, 34.53280258178711, 37.41059112548828, 40.28838348388672, 43.16617202758789, 46.04396057128906, 48.9217529296875, 51.79954147338867, 54.677330017089844, 57.55512237548828, 60.43291091918945, 63.310699462890625, 66.18849182128906, 69.06627655029297, 71.9440689086914, 74.82185363769531, 77.69964599609375, 80.57743835449219, 83.45523071289062, 86.33301544189453, 89.21080780029297, 92.08859252929688, 94.96638488769531, 97.84417724609375, 100.72196197509766, 103.5997543334961, 106.4775390625, 109.35533142089844, 112.23312377929688, 115.11090850830078, 117.98870086669922, 120.86648559570312, 123.74427795410156, 126.6220703125, 129.49986267089844, 132.37765502929688, 135.2554473876953, 138.13323974609375, 141.01101684570312, 143.88880920410156, 146.7666015625, 149.64439392089844, 152.52218627929688, 155.39996337890625]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 11.0, 6.0, 9.0, 12.0, 14.0, 16.0, 15.0, 14.0, 14.0, 17.0, 16.0, 30.0, 23.0, 29.0, 27.0, 33.0, 43.0, 40.0, 42.0, 34.0, 39.0, 48.0, 35.0, 28.0, 45.0, 35.0, 30.0, 33.0, 26.0, 25.0, 20.0, 25.0, 21.0, 17.0, 22.0, 13.0, 14.0, 13.0, 11.0, 6.0, 10.0, 8.0, 6.0, 5.0, 2.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.614334106445312, -28.640439987182617, -27.666547775268555, -26.69265365600586, -25.718761444091797, -24.7448673248291, -23.770973205566406, -22.797080993652344, -21.82318687438965, -20.849292755126953, -19.87540054321289, -18.901506423950195, -17.9276123046875, -16.953720092773438, -15.979825973510742, -15.005932807922363, -14.032039642333984, -13.058146476745605, -12.084253311157227, -11.110359191894531, -10.136466026306152, -9.162572860717773, -8.188678741455078, -7.214785575866699, -6.24089241027832, -5.266999244689941, -4.293105602264404, -3.3192121982574463, -2.3453187942504883, -1.3714256286621094, -0.39753198623657227, 0.5763616561889648, 1.5502548217773438, 2.5241482257843018, 3.4980416297912598, 4.471935272216797, 5.445828437805176, 6.419721603393555, 7.393615245819092, 8.367508888244629, 9.341402053833008, 10.315295219421387, 11.289188385009766, 12.263082504272461, 13.23697566986084, 14.210868835449219, 15.184762954711914, 16.15865707397461, 17.132549285888672, 18.106443405151367, 19.08033561706543, 20.054229736328125, 21.028121948242188, 22.002016067504883, 22.975910186767578, 23.94980239868164, 24.923696517944336, 25.89759063720703, 26.871482849121094, 27.84537696838379, 28.819271087646484, 29.793163299560547, 30.767057418823242, 31.740951538085938, 32.71484375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 5.0, 6.0, 14.0, 18.0, 13.0, 19.0, 30.0, 20.0, 26.0, 36.0, 31.0, 34.0, 44.0, 34.0, 42.0, 36.0, 28.0, 32.0, 37.0, 44.0, 36.0, 40.0, 34.0, 35.0, 33.0, 29.0, 29.0, 27.0, 26.0, 14.0, 23.0, 17.0, 26.0, 10.0, 12.0, 6.0, 5.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-4.5234375, -4.3868408203125, -4.250244140625, -4.1136474609375, -3.97705078125, -3.8404541015625, -3.703857421875, -3.5672607421875, -3.4306640625, -3.2940673828125, -3.157470703125, -3.0208740234375, -2.88427734375, -2.7476806640625, -2.611083984375, -2.4744873046875, -2.337890625, -2.2012939453125, -2.064697265625, -1.9281005859375, -1.79150390625, -1.6549072265625, -1.518310546875, -1.3817138671875, -1.2451171875, -1.1085205078125, -0.971923828125, -0.8353271484375, -0.69873046875, -0.5621337890625, -0.425537109375, -0.2889404296875, -0.15234375, -0.0157470703125, 0.120849609375, 0.2574462890625, 0.39404296875, 0.5306396484375, 0.667236328125, 0.8038330078125, 0.9404296875, 1.0770263671875, 1.213623046875, 1.3502197265625, 1.48681640625, 1.6234130859375, 1.760009765625, 1.8966064453125, 2.033203125, 2.1697998046875, 2.306396484375, 2.4429931640625, 2.57958984375, 2.7161865234375, 2.852783203125, 2.9893798828125, 3.1259765625, 3.2625732421875, 3.399169921875, 3.5357666015625, 3.67236328125, 3.8089599609375, 3.945556640625, 4.0821533203125, 4.21875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 9.0, 10.0, 16.0, 25.0, 20.0, 49.0, 77.0, 112.0, 158.0, 262.0, 393.0, 610.0, 898.0, 1466.0, 2260.0, 3491.0, 5534.0, 8680.0, 13908.0, 23463.0, 40485.0, 75046.0, 147212.0, 256414.0, 215325.0, 111782.0, 57901.0, 32297.0, 18997.0, 11660.0, 7238.0, 4590.0, 2811.0, 1815.0, 1235.0, 781.0, 517.0, 342.0, 224.0, 148.0, 112.0, 60.0, 43.0, 34.0, 20.0, 7.0, 8.0, 3.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7509765625, -0.726593017578125, -0.70220947265625, -0.677825927734375, -0.6534423828125, -0.629058837890625, -0.60467529296875, -0.580291748046875, -0.555908203125, -0.531524658203125, -0.50714111328125, -0.482757568359375, -0.4583740234375, -0.433990478515625, -0.40960693359375, -0.385223388671875, -0.36083984375, -0.336456298828125, -0.31207275390625, -0.287689208984375, -0.2633056640625, -0.238922119140625, -0.21453857421875, -0.190155029296875, -0.165771484375, -0.141387939453125, -0.11700439453125, -0.092620849609375, -0.0682373046875, -0.043853759765625, -0.01947021484375, 0.004913330078125, 0.029296875, 0.053680419921875, 0.07806396484375, 0.102447509765625, 0.1268310546875, 0.151214599609375, 0.17559814453125, 0.199981689453125, 0.224365234375, 0.248748779296875, 0.27313232421875, 0.297515869140625, 0.3218994140625, 0.346282958984375, 0.37066650390625, 0.395050048828125, 0.41943359375, 0.443817138671875, 0.46820068359375, 0.492584228515625, 0.5169677734375, 0.541351318359375, 0.56573486328125, 0.590118408203125, 0.614501953125, 0.638885498046875, 0.66326904296875, 0.687652587890625, 0.7120361328125, 0.736419677734375, 0.76080322265625, 0.785186767578125, 0.8095703125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 5.0, 3.0, 7.0, 9.0, 11.0, 16.0, 14.0, 17.0, 14.0, 17.0, 32.0, 20.0, 28.0, 33.0, 35.0, 40.0, 38.0, 38.0, 47.0, 50.0, 1069.0, 52.0, 34.0, 31.0, 37.0, 36.0, 37.0, 35.0, 27.0, 26.0, 29.0, 18.0, 11.0, 16.0, 11.0, 13.0, 7.0, 17.0, 9.0, 5.0, 4.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0], "bins": [-3.076171875, -2.988128662109375, -2.90008544921875, -2.812042236328125, -2.7239990234375, -2.635955810546875, -2.54791259765625, -2.459869384765625, -2.371826171875, -2.283782958984375, -2.19573974609375, -2.107696533203125, -2.0196533203125, -1.931610107421875, -1.84356689453125, -1.755523681640625, -1.66748046875, -1.579437255859375, -1.49139404296875, -1.403350830078125, -1.3153076171875, -1.227264404296875, -1.13922119140625, -1.051177978515625, -0.963134765625, -0.875091552734375, -0.78704833984375, -0.699005126953125, -0.6109619140625, -0.522918701171875, -0.43487548828125, -0.346832275390625, -0.2587890625, -0.170745849609375, -0.08270263671875, 0.005340576171875, 0.0933837890625, 0.181427001953125, 0.26947021484375, 0.357513427734375, 0.445556640625, 0.533599853515625, 0.62164306640625, 0.709686279296875, 0.7977294921875, 0.885772705078125, 0.97381591796875, 1.061859130859375, 1.14990234375, 1.237945556640625, 1.32598876953125, 1.414031982421875, 1.5020751953125, 1.590118408203125, 1.67816162109375, 1.766204833984375, 1.854248046875, 1.942291259765625, 2.03033447265625, 2.118377685546875, 2.2064208984375, 2.294464111328125, 2.38250732421875, 2.470550537109375, 2.55859375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 9.0, 18.0, 23.0, 45.0, 52.0, 77.0, 130.0, 165.0, 260.0, 439.0, 595.0, 1008.0, 1606.0, 2525.0, 4139.0, 6757.0, 11422.0, 19449.0, 34005.0, 61358.0, 112590.0, 195856.0, 1282080.0, 159925.0, 87398.0, 48065.0, 27553.0, 15593.0, 9251.0, 5595.0, 3432.0, 2061.0, 1257.0, 836.0, 539.0, 358.0, 214.0, 140.0, 97.0, 64.0, 39.0, 32.0, 13.0, 23.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.53076171875, -0.5143280029296875, -0.497894287109375, -0.4814605712890625, -0.46502685546875, -0.4485931396484375, -0.432159423828125, -0.4157257080078125, -0.3992919921875, -0.3828582763671875, -0.366424560546875, -0.3499908447265625, -0.33355712890625, -0.3171234130859375, -0.300689697265625, -0.2842559814453125, -0.267822265625, -0.2513885498046875, -0.234954833984375, -0.2185211181640625, -0.20208740234375, -0.1856536865234375, -0.169219970703125, -0.1527862548828125, -0.1363525390625, -0.1199188232421875, -0.103485107421875, -0.0870513916015625, -0.07061767578125, -0.0541839599609375, -0.037750244140625, -0.0213165283203125, -0.0048828125, 0.0115509033203125, 0.027984619140625, 0.0444183349609375, 0.06085205078125, 0.0772857666015625, 0.093719482421875, 0.1101531982421875, 0.1265869140625, 0.1430206298828125, 0.159454345703125, 0.1758880615234375, 0.19232177734375, 0.2087554931640625, 0.225189208984375, 0.2416229248046875, 0.258056640625, 0.2744903564453125, 0.290924072265625, 0.3073577880859375, 0.32379150390625, 0.3402252197265625, 0.356658935546875, 0.3730926513671875, 0.3895263671875, 0.4059600830078125, 0.422393798828125, 0.4388275146484375, 0.45526123046875, 0.4716949462890625, 0.488128662109375, 0.5045623779296875, 0.52099609375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 5.0, 6.0, 7.0, 12.0, 20.0, 14.0, 18.0, 19.0, 18.0, 18.0, 25.0, 25.0, 32.0, 50.0, 34.0, 45.0, 47.0, 43.0, 57.0, 51.0, 41.0, 46.0, 33.0, 36.0, 39.0, 36.0, 34.0, 22.0, 30.0, 21.0, 19.0, 18.0, 16.0, 11.0, 4.0, 7.0, 8.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.00141143798828125, -0.0013677775859832764, -0.0013241171836853027, -0.001280456781387329, -0.0012367963790893555, -0.0011931359767913818, -0.0011494755744934082, -0.0011058151721954346, -0.001062154769897461, -0.0010184943675994873, -0.0009748339653015137, -0.00093117356300354, -0.0008875131607055664, -0.0008438527584075928, -0.0008001923561096191, -0.0007565319538116455, -0.0007128715515136719, -0.0006692111492156982, -0.0006255507469177246, -0.000581890344619751, -0.0005382299423217773, -0.0004945695400238037, -0.0004509091377258301, -0.00040724873542785645, -0.0003635883331298828, -0.0003199279308319092, -0.00027626752853393555, -0.00023260712623596191, -0.00018894672393798828, -0.00014528632164001465, -0.00010162591934204102, -5.796551704406738e-05, -1.430511474609375e-05, 2.9355287551879883e-05, 7.301568984985352e-05, 0.00011667609214782715, 0.00016033649444580078, 0.00020399689674377441, 0.00024765729904174805, 0.0002913177013397217, 0.0003349781036376953, 0.00037863850593566895, 0.0004222989082336426, 0.0004659593105316162, 0.0005096197128295898, 0.0005532801151275635, 0.0005969405174255371, 0.0006406009197235107, 0.0006842613220214844, 0.000727921724319458, 0.0007715821266174316, 0.0008152425289154053, 0.0008589029312133789, 0.0009025633335113525, 0.0009462237358093262, 0.0009898841381072998, 0.0010335445404052734, 0.001077204942703247, 0.0011208653450012207, 0.0011645257472991943, 0.001208186149597168, 0.0012518465518951416, 0.0012955069541931152, 0.0013391673564910889, 0.0013828277587890625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 6.0, 5.0, 8.0, 8.0, 11.0, 27.0, 23.0, 24.0, 37.0, 52.0, 72.0, 104.0, 134.0, 231.0, 401.0, 772.0, 7304.0, 932237.0, 103894.0, 1785.0, 534.0, 283.0, 176.0, 129.0, 66.0, 53.0, 33.0, 36.0, 25.0, 14.0, 18.0, 9.0, 10.0, 8.0, 8.0, 5.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0401611328125, -0.03889656066894531, -0.037631988525390625, -0.03636741638183594, -0.03510284423828125, -0.03383827209472656, -0.032573699951171875, -0.03130912780761719, -0.0300445556640625, -0.028779983520507812, -0.027515411376953125, -0.026250839233398438, -0.02498626708984375, -0.023721694946289062, -0.022457122802734375, -0.021192550659179688, -0.019927978515625, -0.018663406372070312, -0.017398834228515625, -0.016134262084960938, -0.01486968994140625, -0.013605117797851562, -0.012340545654296875, -0.011075973510742188, -0.0098114013671875, -0.008546829223632812, -0.007282257080078125, -0.0060176849365234375, -0.00475311279296875, -0.0034885406494140625, -0.002223968505859375, -0.0009593963623046875, 0.00030517578125, 0.0015697479248046875, 0.002834320068359375, 0.0040988922119140625, 0.00536346435546875, 0.0066280364990234375, 0.007892608642578125, 0.009157180786132812, 0.0104217529296875, 0.011686325073242188, 0.012950897216796875, 0.014215469360351562, 0.01548004150390625, 0.016744613647460938, 0.018009185791015625, 0.019273757934570312, 0.020538330078125, 0.021802902221679688, 0.023067474365234375, 0.024332046508789062, 0.02559661865234375, 0.026861190795898438, 0.028125762939453125, 0.029390335083007812, 0.0306549072265625, 0.03191947937011719, 0.033184051513671875, 0.03444862365722656, 0.03571319580078125, 0.03697776794433594, 0.038242340087890625, 0.03950691223144531, 0.040771484375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 364.0, 642.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007213766220957041, -0.006619041319936514, -0.006024316884577274, -0.0054295919835567474, -0.0048348670825362206, -0.004240142181515694, -0.0036454175133258104, -0.003050692845135927, -0.0024559679441154003, -0.0018612431595101953, -0.0012665183749049902, -0.0006717935902997851, -7.706880569458008e-05, 0.0005176560953259468, 0.00111238076351583, 0.0017071054317057133, 0.00230183033272624, 0.002896555233746767, 0.0034912799019366503, 0.0040860045701265335, 0.00468072947114706, 0.005275454372167587, 0.005870179273188114, 0.006464903708547354, 0.007059628609567881, 0.0076543535105884075, 0.008249077945947647, 0.008843802846968174, 0.0094385277479887, 0.010033252649009228, 0.010627977550029755, 0.011222701519727707, 0.011817427352070808, 0.012412152253091335, 0.013006877154111862, 0.013601602055132389, 0.014196326956152916, 0.014791050925850868, 0.015385775826871395, 0.015980500727891922, 0.016575224697589874, 0.017169948667287827, 0.017764674499630928, 0.01835939846932888, 0.018954124301671982, 0.019548848271369934, 0.020143574103713036, 0.020738298073410988, 0.02133302390575409, 0.02192774787545204, 0.022522473707795143, 0.023117197677493095, 0.023711923509836197, 0.02430664747953415, 0.02490137331187725, 0.025496097281575203, 0.026090823113918304, 0.026685547083616257, 0.027280272915959358, 0.02787499688565731, 0.028469722718000412, 0.029064446687698364, 0.029659172520041466, 0.030253896489739418, 0.03084862045943737]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 8.0, 6.0, 3.0, 8.0, 7.0, 14.0, 12.0, 17.0, 15.0, 25.0, 29.0, 20.0, 32.0, 28.0, 38.0, 41.0, 40.0, 46.0, 48.0, 52.0, 56.0, 48.0, 48.0, 47.0, 49.0, 37.0, 40.0, 35.0, 18.0, 21.0, 19.0, 16.0, 15.0, 15.0, 16.0, 3.0, 3.0, 11.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0009328126907348633, -0.0009030187502503395, -0.0008732248097658157, -0.000843430869281292, -0.0008136369287967682, -0.0007838429883122444, -0.0007540490478277206, -0.0007242551073431969, -0.0006944611668586731, -0.0006646672263741493, -0.0006348732858896255, -0.0006050793454051018, -0.000575285404920578, -0.0005454914644360542, -0.0005156975239515305, -0.0004859035834670067, -0.0004561096429824829, -0.00042631570249795914, -0.00039652176201343536, -0.0003667278215289116, -0.0003369338810443878, -0.00030713994055986404, -0.00027734600007534027, -0.0002475520595908165, -0.00021775811910629272, -0.00018796417862176895, -0.00015817023813724518, -0.0001283762976527214, -9.858235716819763e-05, -6.878841668367386e-05, -3.8994476199150085e-05, -9.200535714626312e-06, 2.059340476989746e-05, 5.0387345254421234e-05, 8.018128573894501e-05, 0.00010997522622346878, 0.00013976916670799255, 0.00016956310719251633, 0.0001993570476770401, 0.00022915098816156387, 0.00025894492864608765, 0.0002887388691306114, 0.0003185328096151352, 0.00034832675009965897, 0.00037812069058418274, 0.0004079146310687065, 0.0004377085715532303, 0.00046750251203775406, 0.0004972964525222778, 0.0005270903930068016, 0.0005568843334913254, 0.0005866782739758492, 0.0006164722144603729, 0.0006462661549448967, 0.0006760600954294205, 0.0007058540359139442, 0.000735647976398468, 0.0007654419168829918, 0.0007952358573675156, 0.0008250297978520393, 0.0008548237383365631, 0.0008846176788210869, 0.0009144116193056107, 0.0009442055597901344, 0.0009739995002746582]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 5.0, 6.0, 14.0, 18.0, 13.0, 19.0, 30.0, 20.0, 26.0, 36.0, 31.0, 34.0, 44.0, 34.0, 42.0, 36.0, 28.0, 32.0, 37.0, 44.0, 36.0, 40.0, 34.0, 35.0, 33.0, 29.0, 29.0, 27.0, 26.0, 14.0, 23.0, 17.0, 26.0, 10.0, 12.0, 6.0, 5.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-4.5234375, -4.3868408203125, -4.250244140625, -4.1136474609375, -3.97705078125, -3.8404541015625, -3.703857421875, -3.5672607421875, -3.4306640625, -3.2940673828125, -3.157470703125, -3.0208740234375, -2.88427734375, -2.7476806640625, -2.611083984375, -2.4744873046875, -2.337890625, -2.2012939453125, -2.064697265625, -1.9281005859375, -1.79150390625, -1.6549072265625, -1.518310546875, -1.3817138671875, -1.2451171875, -1.1085205078125, -0.971923828125, -0.8353271484375, -0.69873046875, -0.5621337890625, -0.425537109375, -0.2889404296875, -0.15234375, -0.0157470703125, 0.120849609375, 0.2574462890625, 0.39404296875, 0.5306396484375, 0.667236328125, 0.8038330078125, 0.9404296875, 1.0770263671875, 1.213623046875, 1.3502197265625, 1.48681640625, 1.6234130859375, 1.760009765625, 1.8966064453125, 2.033203125, 2.1697998046875, 2.306396484375, 2.4429931640625, 2.57958984375, 2.7161865234375, 2.852783203125, 2.9893798828125, 3.1259765625, 3.2625732421875, 3.399169921875, 3.5357666015625, 3.67236328125, 3.8089599609375, 3.945556640625, 4.0821533203125, 4.21875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 10.0, 13.0, 9.0, 26.0, 27.0, 34.0, 52.0, 64.0, 125.0, 164.0, 269.0, 419.0, 715.0, 1185.0, 2142.0, 3516.0, 6099.0, 10663.0, 19423.0, 38587.0, 86865.0, 270870.0, 384790.0, 119545.0, 48566.0, 23858.0, 12763.0, 7380.0, 4211.0, 2430.0, 1497.0, 858.0, 493.0, 284.0, 190.0, 139.0, 76.0, 58.0, 43.0, 31.0, 19.0, 11.0, 13.0, 14.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.1875, -3.09136962890625, -2.9952392578125, -2.89910888671875, -2.802978515625, -2.70684814453125, -2.6107177734375, -2.51458740234375, -2.41845703125, -2.32232666015625, -2.2261962890625, -2.13006591796875, -2.033935546875, -1.93780517578125, -1.8416748046875, -1.74554443359375, -1.6494140625, -1.55328369140625, -1.4571533203125, -1.36102294921875, -1.264892578125, -1.16876220703125, -1.0726318359375, -0.97650146484375, -0.88037109375, -0.78424072265625, -0.6881103515625, -0.59197998046875, -0.495849609375, -0.39971923828125, -0.3035888671875, -0.20745849609375, -0.111328125, -0.01519775390625, 0.0809326171875, 0.17706298828125, 0.273193359375, 0.36932373046875, 0.4654541015625, 0.56158447265625, 0.65771484375, 0.75384521484375, 0.8499755859375, 0.94610595703125, 1.042236328125, 1.13836669921875, 1.2344970703125, 1.33062744140625, 1.4267578125, 1.52288818359375, 1.6190185546875, 1.71514892578125, 1.811279296875, 1.90740966796875, 2.0035400390625, 2.09967041015625, 2.19580078125, 2.29193115234375, 2.3880615234375, 2.48419189453125, 2.580322265625, 2.67645263671875, 2.7725830078125, 2.86871337890625, 2.96484375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 5.0, 10.0, 11.0, 7.0, 11.0, 23.0, 18.0, 20.0, 22.0, 22.0, 29.0, 35.0, 43.0, 38.0, 37.0, 72.0, 179.0, 1693.0, 225.0, 81.0, 65.0, 44.0, 45.0, 40.0, 32.0, 33.0, 28.0, 24.0, 20.0, 31.0, 22.0, 13.0, 12.0, 10.0, 7.0, 9.0, 3.0, 4.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8046875, -13.2845458984375, -12.764404296875, -12.2442626953125, -11.72412109375, -11.2039794921875, -10.683837890625, -10.1636962890625, -9.6435546875, -9.1234130859375, -8.603271484375, -8.0831298828125, -7.56298828125, -7.0428466796875, -6.522705078125, -6.0025634765625, -5.482421875, -4.9622802734375, -4.442138671875, -3.9219970703125, -3.40185546875, -2.8817138671875, -2.361572265625, -1.8414306640625, -1.3212890625, -0.8011474609375, -0.281005859375, 0.2391357421875, 0.75927734375, 1.2794189453125, 1.799560546875, 2.3197021484375, 2.83984375, 3.3599853515625, 3.880126953125, 4.4002685546875, 4.92041015625, 5.4405517578125, 5.960693359375, 6.4808349609375, 7.0009765625, 7.5211181640625, 8.041259765625, 8.5614013671875, 9.08154296875, 9.6016845703125, 10.121826171875, 10.6419677734375, 11.162109375, 11.6822509765625, 12.202392578125, 12.7225341796875, 13.24267578125, 13.7628173828125, 14.282958984375, 14.8031005859375, 15.3232421875, 15.8433837890625, 16.363525390625, 16.8836669921875, 17.40380859375, 17.9239501953125, 18.444091796875, 18.9642333984375, 19.484375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 13.0, 13.0, 10.0, 21.0, 32.0, 40.0, 56.0, 72.0, 97.0, 179.0, 279.0, 556.0, 2920.0, 2910897.0, 227915.0, 1542.0, 423.0, 230.0, 128.0, 76.0, 61.0, 38.0, 19.0, 26.0, 14.0, 12.0, 5.0, 7.0, 9.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.09375, -46.53662109375, -44.9794921875, -43.42236328125, -41.865234375, -40.30810546875, -38.7509765625, -37.19384765625, -35.63671875, -34.07958984375, -32.5224609375, -30.96533203125, -29.408203125, -27.85107421875, -26.2939453125, -24.73681640625, -23.1796875, -21.62255859375, -20.0654296875, -18.50830078125, -16.951171875, -15.39404296875, -13.8369140625, -12.27978515625, -10.72265625, -9.16552734375, -7.6083984375, -6.05126953125, -4.494140625, -2.93701171875, -1.3798828125, 0.17724609375, 1.734375, 3.29150390625, 4.8486328125, 6.40576171875, 7.962890625, 9.52001953125, 11.0771484375, 12.63427734375, 14.19140625, 15.74853515625, 17.3056640625, 18.86279296875, 20.419921875, 21.97705078125, 23.5341796875, 25.09130859375, 26.6484375, 28.20556640625, 29.7626953125, 31.31982421875, 32.876953125, 34.43408203125, 35.9912109375, 37.54833984375, 39.10546875, 40.66259765625, 42.2197265625, 43.77685546875, 45.333984375, 46.89111328125, 48.4482421875, 50.00537109375, 51.5625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 187.0, 759.0, 69.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.774166107177734, -20.15549087524414, -15.53681468963623, -10.91813850402832, -6.299463272094727, -1.6807880401611328, 2.9378890991210938, 7.5565643310546875, 12.175239562988281, 16.793914794921875, 21.41259002685547, 26.031267166137695, 30.64994239807129, 35.26861572265625, 39.88729476928711, 44.5059700012207, 49.1246452331543, 53.74332046508789, 58.361995697021484, 62.980674743652344, 67.59934997558594, 72.21802520751953, 76.83670043945312, 81.45537567138672, 86.07405090332031, 90.6927261352539, 95.3114013671875, 99.9300765991211, 104.54875183105469, 109.16742706298828, 113.78610229492188, 118.40478515625, 123.02345275878906, 127.64212799072266, 132.26080322265625, 136.87948608398438, 141.49815368652344, 146.11683654785156, 150.73550415039062, 155.35418701171875, 159.9728546142578, 164.59153747558594, 169.210205078125, 173.82888793945312, 178.4475555419922, 183.0662384033203, 187.68490600585938, 192.3035888671875, 196.92227172851562, 201.54095458984375, 206.1596221923828, 210.77830505371094, 215.39697265625, 220.01565551757812, 224.6343231201172, 229.2530059814453, 233.87167358398438, 238.4903564453125, 243.10902404785156, 247.7277069091797, 252.34637451171875, 256.9650573730469, 261.583740234375, 266.202392578125, 270.8210754394531]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 8.0, 5.0, 14.0, 5.0, 5.0, 19.0, 18.0, 16.0, 18.0, 19.0, 26.0, 24.0, 27.0, 31.0, 37.0, 37.0, 40.0, 46.0, 35.0, 36.0, 40.0, 42.0, 44.0, 34.0, 37.0, 39.0, 30.0, 31.0, 33.0, 33.0, 37.0, 22.0, 19.0, 18.0, 18.0, 15.0, 6.0, 1.0, 13.0, 6.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.74343490600586, -43.338130950927734, -41.932823181152344, -40.52751922607422, -39.12221145629883, -37.7169075012207, -36.31159973144531, -34.90629577636719, -33.5009880065918, -32.09568405151367, -30.69037628173828, -29.285070419311523, -27.879764556884766, -26.474458694458008, -25.06915283203125, -23.663848876953125, -22.258543014526367, -20.85323715209961, -19.44793128967285, -18.042625427246094, -16.637319564819336, -15.232013702392578, -13.826708793640137, -12.421402931213379, -11.016097068786621, -9.610791206359863, -8.205485343933105, -6.800179958343506, -5.394874095916748, -3.9895682334899902, -2.5842628479003906, -1.1789569854736328, 0.226348876953125, 1.6316546201705933, 3.0369603633880615, 4.44226598739624, 5.847571849822998, 7.252877712249756, 8.658183097839355, 10.063488960266113, 11.468794822692871, 12.874100685119629, 14.279406547546387, 15.684711456298828, 17.090017318725586, 18.495323181152344, 19.9006290435791, 21.30593490600586, 22.711240768432617, 24.116546630859375, 25.521852493286133, 26.92715835571289, 28.33246421813965, 29.737770080566406, 31.14307403564453, 32.54838180541992, 33.95368576049805, 35.35898971557617, 36.76429748535156, 38.16960144042969, 39.57490921020508, 40.9802131652832, 42.385520935058594, 43.79082489013672, 45.19613265991211]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 2.0, 4.0, 1.0, 5.0, 10.0, 10.0, 11.0, 9.0, 17.0, 18.0, 14.0, 30.0, 30.0, 32.0, 30.0, 34.0, 38.0, 38.0, 29.0, 43.0, 39.0, 39.0, 32.0, 34.0, 48.0, 50.0, 35.0, 27.0, 30.0, 23.0, 30.0, 30.0, 26.0, 25.0, 21.0, 22.0, 16.0, 14.0, 13.0, 5.0, 10.0, 5.0, 6.0, 6.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.69921875, -4.55474853515625, -4.4102783203125, -4.26580810546875, -4.121337890625, -3.97686767578125, -3.8323974609375, -3.68792724609375, -3.54345703125, -3.39898681640625, -3.2545166015625, -3.11004638671875, -2.965576171875, -2.82110595703125, -2.6766357421875, -2.53216552734375, -2.3876953125, -2.24322509765625, -2.0987548828125, -1.95428466796875, -1.809814453125, -1.66534423828125, -1.5208740234375, -1.37640380859375, -1.23193359375, -1.08746337890625, -0.9429931640625, -0.79852294921875, -0.654052734375, -0.50958251953125, -0.3651123046875, -0.22064208984375, -0.076171875, 0.06829833984375, 0.2127685546875, 0.35723876953125, 0.501708984375, 0.64617919921875, 0.7906494140625, 0.93511962890625, 1.07958984375, 1.22406005859375, 1.3685302734375, 1.51300048828125, 1.657470703125, 1.80194091796875, 1.9464111328125, 2.09088134765625, 2.2353515625, 2.37982177734375, 2.5242919921875, 2.66876220703125, 2.813232421875, 2.95770263671875, 3.1021728515625, 3.24664306640625, 3.39111328125, 3.53558349609375, 3.6800537109375, 3.82452392578125, 3.968994140625, 4.11346435546875, 4.2579345703125, 4.40240478515625, 4.546875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 10.0, 14.0, 22.0, 20.0, 26.0, 45.0, 59.0, 72.0, 102.0, 149.0, 222.0, 322.0, 541.0, 1027.0, 1993.0, 4663.0, 13065.0, 48782.0, 262994.0, 1251775.0, 1857373.0, 607925.0, 104905.0, 23947.0, 7720.0, 2978.0, 1409.0, 725.0, 432.0, 266.0, 192.0, 146.0, 94.0, 64.0, 37.0, 49.0, 21.0, 18.0, 12.0, 14.0, 12.0, 5.0, 10.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.56640625, -6.32537841796875, -6.0843505859375, -5.84332275390625, -5.602294921875, -5.36126708984375, -5.1202392578125, -4.87921142578125, -4.63818359375, -4.39715576171875, -4.1561279296875, -3.91510009765625, -3.674072265625, -3.43304443359375, -3.1920166015625, -2.95098876953125, -2.7099609375, -2.46893310546875, -2.2279052734375, -1.98687744140625, -1.745849609375, -1.50482177734375, -1.2637939453125, -1.02276611328125, -0.78173828125, -0.54071044921875, -0.2996826171875, -0.05865478515625, 0.182373046875, 0.42340087890625, 0.6644287109375, 0.90545654296875, 1.146484375, 1.38751220703125, 1.6285400390625, 1.86956787109375, 2.110595703125, 2.35162353515625, 2.5926513671875, 2.83367919921875, 3.07470703125, 3.31573486328125, 3.5567626953125, 3.79779052734375, 4.038818359375, 4.27984619140625, 4.5208740234375, 4.76190185546875, 5.0029296875, 5.24395751953125, 5.4849853515625, 5.72601318359375, 5.967041015625, 6.20806884765625, 6.4490966796875, 6.69012451171875, 6.93115234375, 7.17218017578125, 7.4132080078125, 7.65423583984375, 7.895263671875, 8.13629150390625, 8.3773193359375, 8.61834716796875, 8.859375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 5.0, 8.0, 9.0, 7.0, 15.0, 25.0, 36.0, 52.0, 84.0, 98.0, 145.0, 191.0, 235.0, 361.0, 412.0, 448.0, 507.0, 375.0, 301.0, 218.0, 154.0, 112.0, 74.0, 58.0, 40.0, 33.0, 24.0, 18.0, 10.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3359375, -10.96728515625, -10.5986328125, -10.22998046875, -9.861328125, -9.49267578125, -9.1240234375, -8.75537109375, -8.38671875, -8.01806640625, -7.6494140625, -7.28076171875, -6.912109375, -6.54345703125, -6.1748046875, -5.80615234375, -5.4375, -5.06884765625, -4.7001953125, -4.33154296875, -3.962890625, -3.59423828125, -3.2255859375, -2.85693359375, -2.48828125, -2.11962890625, -1.7509765625, -1.38232421875, -1.013671875, -0.64501953125, -0.2763671875, 0.09228515625, 0.4609375, 0.82958984375, 1.1982421875, 1.56689453125, 1.935546875, 2.30419921875, 2.6728515625, 3.04150390625, 3.41015625, 3.77880859375, 4.1474609375, 4.51611328125, 4.884765625, 5.25341796875, 5.6220703125, 5.99072265625, 6.359375, 6.72802734375, 7.0966796875, 7.46533203125, 7.833984375, 8.20263671875, 8.5712890625, 8.93994140625, 9.30859375, 9.67724609375, 10.0458984375, 10.41455078125, 10.783203125, 11.15185546875, 11.5205078125, 11.88916015625, 12.2578125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 5.0, 7.0, 6.0, 12.0, 9.0, 21.0, 24.0, 41.0, 42.0, 52.0, 97.0, 112.0, 169.0, 223.0, 550.0, 1685.0, 37444.0, 3770563.0, 376571.0, 4780.0, 796.0, 347.0, 216.0, 150.0, 95.0, 68.0, 47.0, 39.0, 33.0, 25.0, 11.0, 11.0, 16.0, 3.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.875, -32.607421875, -31.33984375, -30.072265625, -28.8046875, -27.537109375, -26.26953125, -25.001953125, -23.734375, -22.466796875, -21.19921875, -19.931640625, -18.6640625, -17.396484375, -16.12890625, -14.861328125, -13.59375, -12.326171875, -11.05859375, -9.791015625, -8.5234375, -7.255859375, -5.98828125, -4.720703125, -3.453125, -2.185546875, -0.91796875, 0.349609375, 1.6171875, 2.884765625, 4.15234375, 5.419921875, 6.6875, 7.955078125, 9.22265625, 10.490234375, 11.7578125, 13.025390625, 14.29296875, 15.560546875, 16.828125, 18.095703125, 19.36328125, 20.630859375, 21.8984375, 23.166015625, 24.43359375, 25.701171875, 26.96875, 28.236328125, 29.50390625, 30.771484375, 32.0390625, 33.306640625, 34.57421875, 35.841796875, 37.109375, 38.376953125, 39.64453125, 40.912109375, 42.1796875, 43.447265625, 44.71484375, 45.982421875, 47.25]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 8.0, 74.0, 270.0, 376.0, 226.0, 44.0, 11.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.75665283203125, -65.4729232788086, -60.18919372558594, -54.905460357666016, -49.62173080444336, -44.3380012512207, -39.05426788330078, -33.770538330078125, -28.48680877685547, -23.203079223632812, -17.919347763061523, -12.63561725616455, -7.351886749267578, -2.068157196044922, 3.215574264526367, 8.499305725097656, 13.783035278320312, 19.06676483154297, 24.350496292114258, 29.634227752685547, 34.9179573059082, 40.20168685913086, 45.48542022705078, 50.76914978027344, 56.052879333496094, 61.33660888671875, 66.6203384399414, 71.90406799316406, 77.18780517578125, 82.47152709960938, 87.75526428222656, 93.03899383544922, 98.32272338867188, 103.60645294189453, 108.89018249511719, 114.17391204833984, 119.4576416015625, 124.74137878417969, 130.0251007080078, 135.308837890625, 140.59255981445312, 145.8762969970703, 151.16001892089844, 156.44375610351562, 161.72747802734375, 167.01121520996094, 172.29493713378906, 177.57867431640625, 182.86241149902344, 188.14614868164062, 193.42987060546875, 198.71360778808594, 203.99732971191406, 209.28106689453125, 214.56478881835938, 219.84852600097656, 225.13226318359375, 230.41600036621094, 235.69972229003906, 240.98345947265625, 246.26718139648438, 251.55091857910156, 256.83465576171875, 262.1183776855469, 267.402099609375]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 6.0, 5.0, 11.0, 9.0, 18.0, 9.0, 20.0, 15.0, 19.0, 19.0, 22.0, 24.0, 28.0, 26.0, 46.0, 31.0, 45.0, 38.0, 41.0, 32.0, 43.0, 48.0, 37.0, 34.0, 38.0, 36.0, 26.0, 29.0, 34.0, 17.0, 24.0, 22.0, 23.0, 23.0, 18.0, 14.0, 20.0, 6.0, 12.0, 6.0, 5.0, 6.0, 0.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.296630859375, -32.26353454589844, -31.23044204711914, -30.19734764099121, -29.16425323486328, -28.13115882873535, -27.098064422607422, -26.064970016479492, -25.031875610351562, -23.998781204223633, -22.965686798095703, -21.932592391967773, -20.899497985839844, -19.866403579711914, -18.833309173583984, -17.800214767456055, -16.767120361328125, -15.734025955200195, -14.700931549072266, -13.667837142944336, -12.634742736816406, -11.601648330688477, -10.568553924560547, -9.535459518432617, -8.502365112304688, -7.469270706176758, -6.436176300048828, -5.403081893920898, -4.369987487792969, -3.336893081665039, -2.3037986755371094, -1.2707042694091797, -0.23760986328125, 0.7954845428466797, 1.8285789489746094, 2.861673355102539, 3.8947677612304688, 4.927862167358398, 5.960956573486328, 6.994050979614258, 8.027145385742188, 9.060239791870117, 10.093334197998047, 11.126428604125977, 12.159523010253906, 13.192617416381836, 14.225711822509766, 15.258806228637695, 16.291900634765625, 17.324995040893555, 18.358089447021484, 19.391183853149414, 20.424278259277344, 21.457372665405273, 22.490467071533203, 23.523561477661133, 24.556655883789062, 25.589750289916992, 26.622844696044922, 27.65593910217285, 28.68903350830078, 29.72212791442871, 30.75522232055664, 31.78831672668457, 32.8214111328125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 7.0, 10.0, 15.0, 17.0, 17.0, 21.0, 29.0, 33.0, 32.0, 32.0, 40.0, 38.0, 46.0, 44.0, 42.0, 42.0, 51.0, 42.0, 46.0, 40.0, 44.0, 40.0, 35.0, 38.0, 38.0, 26.0, 26.0, 19.0, 15.0, 17.0, 15.0, 13.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.99505615234375, -4.8260498046875, -4.65704345703125, -4.488037109375, -4.31903076171875, -4.1500244140625, -3.98101806640625, -3.81201171875, -3.64300537109375, -3.4739990234375, -3.30499267578125, -3.135986328125, -2.96697998046875, -2.7979736328125, -2.62896728515625, -2.4599609375, -2.29095458984375, -2.1219482421875, -1.95294189453125, -1.783935546875, -1.61492919921875, -1.4459228515625, -1.27691650390625, -1.10791015625, -0.93890380859375, -0.7698974609375, -0.60089111328125, -0.431884765625, -0.26287841796875, -0.0938720703125, 0.07513427734375, 0.244140625, 0.41314697265625, 0.5821533203125, 0.75115966796875, 0.920166015625, 1.08917236328125, 1.2581787109375, 1.42718505859375, 1.59619140625, 1.76519775390625, 1.9342041015625, 2.10321044921875, 2.272216796875, 2.44122314453125, 2.6102294921875, 2.77923583984375, 2.9482421875, 3.11724853515625, 3.2862548828125, 3.45526123046875, 3.624267578125, 3.79327392578125, 3.9622802734375, 4.13128662109375, 4.30029296875, 4.46929931640625, 4.6383056640625, 4.80731201171875, 4.976318359375, 5.14532470703125, 5.3143310546875, 5.48333740234375, 5.65234375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 11.0, 13.0, 21.0, 34.0, 49.0, 56.0, 79.0, 107.0, 136.0, 200.0, 303.0, 424.0, 646.0, 907.0, 1370.0, 2016.0, 2831.0, 4187.0, 6236.0, 9394.0, 14321.0, 22065.0, 34259.0, 55022.0, 89569.0, 148893.0, 207474.0, 168601.0, 103533.0, 63244.0, 39051.0, 24920.0, 15895.0, 10536.0, 7142.0, 4708.0, 3257.0, 2242.0, 1520.0, 1053.0, 676.0, 495.0, 341.0, 210.0, 149.0, 115.0, 71.0, 53.0, 38.0, 32.0, 23.0, 8.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0], "bins": [-0.572265625, -0.5535888671875, -0.534912109375, -0.5162353515625, -0.49755859375, -0.4788818359375, -0.460205078125, -0.4415283203125, -0.4228515625, -0.4041748046875, -0.385498046875, -0.3668212890625, -0.34814453125, -0.3294677734375, -0.310791015625, -0.2921142578125, -0.2734375, -0.2547607421875, -0.236083984375, -0.2174072265625, -0.19873046875, -0.1800537109375, -0.161376953125, -0.1427001953125, -0.1240234375, -0.1053466796875, -0.086669921875, -0.0679931640625, -0.04931640625, -0.0306396484375, -0.011962890625, 0.0067138671875, 0.025390625, 0.0440673828125, 0.062744140625, 0.0814208984375, 0.10009765625, 0.1187744140625, 0.137451171875, 0.1561279296875, 0.1748046875, 0.1934814453125, 0.212158203125, 0.2308349609375, 0.24951171875, 0.2681884765625, 0.286865234375, 0.3055419921875, 0.32421875, 0.3428955078125, 0.361572265625, 0.3802490234375, 0.39892578125, 0.4176025390625, 0.436279296875, 0.4549560546875, 0.4736328125, 0.4923095703125, 0.510986328125, 0.5296630859375, 0.54833984375, 0.5670166015625, 0.585693359375, 0.6043701171875, 0.623046875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 12.0, 7.0, 11.0, 11.0, 12.0, 17.0, 31.0, 36.0, 40.0, 31.0, 39.0, 51.0, 43.0, 37.0, 58.0, 1092.0, 59.0, 54.0, 48.0, 43.0, 44.0, 28.0, 42.0, 21.0, 34.0, 16.0, 28.0, 21.0, 14.0, 12.0, 8.0, 1.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.16015625, -3.04095458984375, -2.9217529296875, -2.80255126953125, -2.683349609375, -2.56414794921875, -2.4449462890625, -2.32574462890625, -2.20654296875, -2.08734130859375, -1.9681396484375, -1.84893798828125, -1.729736328125, -1.61053466796875, -1.4913330078125, -1.37213134765625, -1.2529296875, -1.13372802734375, -1.0145263671875, -0.89532470703125, -0.776123046875, -0.65692138671875, -0.5377197265625, -0.41851806640625, -0.29931640625, -0.18011474609375, -0.0609130859375, 0.05828857421875, 0.177490234375, 0.29669189453125, 0.4158935546875, 0.53509521484375, 0.654296875, 0.77349853515625, 0.8927001953125, 1.01190185546875, 1.131103515625, 1.25030517578125, 1.3695068359375, 1.48870849609375, 1.60791015625, 1.72711181640625, 1.8463134765625, 1.96551513671875, 2.084716796875, 2.20391845703125, 2.3231201171875, 2.44232177734375, 2.5615234375, 2.68072509765625, 2.7999267578125, 2.91912841796875, 3.038330078125, 3.15753173828125, 3.2767333984375, 3.39593505859375, 3.51513671875, 3.63433837890625, 3.7535400390625, 3.87274169921875, 3.991943359375, 4.11114501953125, 4.2303466796875, 4.34954833984375, 4.46875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 14.0, 9.0, 33.0, 47.0, 59.0, 116.0, 184.0, 317.0, 507.0, 972.0, 1786.0, 3371.0, 6347.0, 12190.0, 24481.0, 51877.0, 113925.0, 243317.0, 1343093.0, 156745.0, 70913.0, 33023.0, 16154.0, 8192.0, 4359.0, 2259.0, 1234.0, 682.0, 374.0, 222.0, 108.0, 78.0, 52.0, 36.0, 16.0, 17.0, 10.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79248046875, -0.7693099975585938, -0.7461395263671875, -0.7229690551757812, -0.699798583984375, -0.6766281127929688, -0.6534576416015625, -0.6302871704101562, -0.60711669921875, -0.5839462280273438, -0.5607757568359375, -0.5376052856445312, -0.514434814453125, -0.49126434326171875, -0.4680938720703125, -0.44492340087890625, -0.4217529296875, -0.39858245849609375, -0.3754119873046875, -0.35224151611328125, -0.329071044921875, -0.30590057373046875, -0.2827301025390625, -0.25955963134765625, -0.23638916015625, -0.21321868896484375, -0.1900482177734375, -0.16687774658203125, -0.143707275390625, -0.12053680419921875, -0.0973663330078125, -0.07419586181640625, -0.051025390625, -0.02785491943359375, -0.0046844482421875, 0.01848602294921875, 0.041656494140625, 0.06482696533203125, 0.0879974365234375, 0.11116790771484375, 0.13433837890625, 0.15750885009765625, 0.1806793212890625, 0.20384979248046875, 0.227020263671875, 0.25019073486328125, 0.2733612060546875, 0.29653167724609375, 0.3197021484375, 0.34287261962890625, 0.3660430908203125, 0.38921356201171875, 0.412384033203125, 0.43555450439453125, 0.4587249755859375, 0.48189544677734375, 0.50506591796875, 0.5282363891601562, 0.5514068603515625, 0.5745773315429688, 0.597747802734375, 0.6209182739257812, 0.6440887451171875, 0.6672592163085938, 0.6904296875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 8.0, 3.0, 6.0, 11.0, 15.0, 19.0, 19.0, 22.0, 30.0, 33.0, 34.0, 37.0, 56.0, 63.0, 49.0, 68.0, 62.0, 66.0, 60.0, 67.0, 39.0, 49.0, 38.0, 39.0, 26.0, 24.0, 15.0, 9.0, 9.0, 6.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0017576217651367188, -0.0016979724168777466, -0.0016383230686187744, -0.0015786737203598022, -0.00151902437210083, -0.001459375023841858, -0.0013997256755828857, -0.0013400763273239136, -0.0012804269790649414, -0.0012207776308059692, -0.001161128282546997, -0.001101478934288025, -0.0010418295860290527, -0.0009821802377700806, -0.0009225308895111084, -0.0008628815412521362, -0.0008032321929931641, -0.0007435828447341919, -0.0006839334964752197, -0.0006242841482162476, -0.0005646347999572754, -0.0005049854516983032, -0.00044533610343933105, -0.0003856867551803589, -0.0003260374069213867, -0.00026638805866241455, -0.00020673871040344238, -0.00014708936214447021, -8.744001388549805e-05, -2.779066562652588e-05, 3.185868263244629e-05, 9.150803089141846e-05, 0.00015115737915039062, 0.0002108067274093628, 0.00027045607566833496, 0.00033010542392730713, 0.0003897547721862793, 0.00044940412044525146, 0.0005090534687042236, 0.0005687028169631958, 0.000628352165222168, 0.0006880015134811401, 0.0007476508617401123, 0.0008073002099990845, 0.0008669495582580566, 0.0009265989065170288, 0.000986248254776001, 0.0010458976030349731, 0.0011055469512939453, 0.0011651962995529175, 0.0012248456478118896, 0.0012844949960708618, 0.001344144344329834, 0.0014037936925888062, 0.0014634430408477783, 0.0015230923891067505, 0.0015827417373657227, 0.0016423910856246948, 0.001702040433883667, 0.0017616897821426392, 0.0018213391304016113, 0.0018809884786605835, 0.0019406378269195557, 0.002000287175178528, 0.0020599365234375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 6.0, 9.0, 13.0, 18.0, 18.0, 19.0, 31.0, 41.0, 60.0, 71.0, 116.0, 191.0, 360.0, 677.0, 3511.0, 663000.0, 376312.0, 2525.0, 646.0, 280.0, 192.0, 117.0, 73.0, 59.0, 34.0, 38.0, 29.0, 21.0, 17.0, 16.0, 13.0, 5.0, 8.0, 3.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0394287109375, -0.03826713562011719, -0.037105560302734375, -0.03594398498535156, -0.03478240966796875, -0.03362083435058594, -0.032459259033203125, -0.03129768371582031, -0.0301361083984375, -0.028974533081054688, -0.027812957763671875, -0.026651382446289062, -0.02548980712890625, -0.024328231811523438, -0.023166656494140625, -0.022005081176757812, -0.020843505859375, -0.019681930541992188, -0.018520355224609375, -0.017358779907226562, -0.01619720458984375, -0.015035629272460938, -0.013874053955078125, -0.012712478637695312, -0.0115509033203125, -0.010389328002929688, -0.009227752685546875, -0.008066177368164062, -0.00690460205078125, -0.0057430267333984375, -0.004581451416015625, -0.0034198760986328125, -0.00225830078125, -0.0010967254638671875, 6.4849853515625e-05, 0.0012264251708984375, 0.00238800048828125, 0.0035495758056640625, 0.004711151123046875, 0.0058727264404296875, 0.0070343017578125, 0.008195877075195312, 0.009357452392578125, 0.010519027709960938, 0.01168060302734375, 0.012842178344726562, 0.014003753662109375, 0.015165328979492188, 0.016326904296875, 0.017488479614257812, 0.018650054931640625, 0.019811630249023438, 0.02097320556640625, 0.022134780883789062, 0.023296356201171875, 0.024457931518554688, 0.0256195068359375, 0.026781082153320312, 0.027942657470703125, 0.029104232788085938, 0.03026580810546875, 0.03142738342285156, 0.032588958740234375, 0.03375053405761719, 0.034912109375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 22.0, 93.0, 270.0, 350.0, 191.0, 66.0, 13.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006533139385282993, -0.006395274773240089, -0.0062574101611971855, -0.006119545549154282, -0.00598168047145009, -0.0058438158594071865, -0.005705951247364283, -0.005568086635321379, -0.005430222023278475, -0.005292357411235571, -0.005154492799192667, -0.005016627721488476, -0.004878763109445572, -0.004740898497402668, -0.004603033885359764, -0.00446516927331686, -0.004327304661273956, -0.004189440049231052, -0.0040515754371881485, -0.003913710825145245, -0.003775845980271697, -0.0036379811353981495, -0.0035001165233552456, -0.0033622519113123417, -0.0032243868336081505, -0.0030865222215652466, -0.002948657376691699, -0.002810792764648795, -0.0026729281526058912, -0.0025350633077323437, -0.0023971986956894398, -0.002259334083646536, -0.0021214692387729883, -0.0019836046267300844, -0.0018457398982718587, -0.001707875169813633, -0.001570010557770729, -0.0014321458293125033, -0.0012942811008542776, -0.0011564164888113737, -0.001018551760353148, -0.0008806870901025832, -0.0007428224198520184, -0.0006049576913937926, -0.0004670930211432278, -0.000329228350892663, -0.00019136362243443727, -5.349895218387246e-05, 8.436571806669235e-05, 0.0002222304028691724, 0.00036009508767165244, 0.0004979597870260477, 0.0006358244572766125, 0.0007736891275271773, 0.0009115538559854031, 0.001049418468028307, 0.0011872831964865327, 0.0013251479249447584, 0.0014630125369876623, 0.001600877265445888, 0.0017387419939041138, 0.0018766066059470177, 0.0020144712179899216, 0.002152336062863469, 0.002290200674906373]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 9.0, 6.0, 13.0, 15.0, 19.0, 18.0, 25.0, 27.0, 33.0, 37.0, 38.0, 36.0, 50.0, 37.0, 46.0, 44.0, 60.0, 48.0, 60.0, 48.0, 36.0, 37.0, 31.0, 36.0, 42.0, 27.0, 29.0, 23.0, 14.0, 12.0, 14.0, 3.0, 4.0, 6.0, 4.0, 3.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0012736916542053223, -0.0012402180582284927, -0.0012067444622516632, -0.0011732708662748337, -0.0011397972702980042, -0.0011063236743211746, -0.001072850078344345, -0.0010393764823675156, -0.001005902886390686, -0.0009724292904138565, -0.000938955694437027, -0.0009054820984601974, -0.0008720085024833679, -0.0008385349065065384, -0.0008050613105297089, -0.0007715877145528793, -0.0007381141185760498, -0.0007046405225992203, -0.0006711669266223907, -0.0006376933306455612, -0.0006042197346687317, -0.0005707461386919022, -0.0005372725427150726, -0.0005037989467382431, -0.0004703253507614136, -0.00043685175478458405, -0.0004033781588077545, -0.000369904562830925, -0.00033643096685409546, -0.00030295737087726593, -0.0002694837749004364, -0.00023601017892360687, -0.00020253658294677734, -0.00016906298696994781, -0.00013558939099311829, -0.00010211579501628876, -6.864219903945923e-05, -3.51686030626297e-05, -1.695007085800171e-06, 3.177858889102936e-05, 6.525218486785889e-05, 9.872578084468842e-05, 0.00013219937682151794, 0.00016567297279834747, 0.000199146568775177, 0.00023262016475200653, 0.00026609376072883606, 0.0002995673567056656, 0.0003330409526824951, 0.00036651454865932465, 0.0003999881446361542, 0.0004334617406129837, 0.00046693533658981323, 0.0005004089325666428, 0.0005338825285434723, 0.0005673561245203018, 0.0006008297204971313, 0.0006343033164739609, 0.0006677769124507904, 0.0007012505084276199, 0.0007347241044044495, 0.000768197700381279, 0.0008016712963581085, 0.000835144892334938, 0.0008686184883117676]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 7.0, 10.0, 15.0, 17.0, 17.0, 21.0, 29.0, 33.0, 32.0, 32.0, 40.0, 38.0, 46.0, 44.0, 42.0, 42.0, 51.0, 42.0, 46.0, 40.0, 44.0, 40.0, 35.0, 38.0, 38.0, 26.0, 26.0, 19.0, 15.0, 17.0, 15.0, 13.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.99505615234375, -4.8260498046875, -4.65704345703125, -4.488037109375, -4.31903076171875, -4.1500244140625, -3.98101806640625, -3.81201171875, -3.64300537109375, -3.4739990234375, -3.30499267578125, -3.135986328125, -2.96697998046875, -2.7979736328125, -2.62896728515625, -2.4599609375, -2.29095458984375, -2.1219482421875, -1.95294189453125, -1.783935546875, -1.61492919921875, -1.4459228515625, -1.27691650390625, -1.10791015625, -0.93890380859375, -0.7698974609375, -0.60089111328125, -0.431884765625, -0.26287841796875, -0.0938720703125, 0.07513427734375, 0.244140625, 0.41314697265625, 0.5821533203125, 0.75115966796875, 0.920166015625, 1.08917236328125, 1.2581787109375, 1.42718505859375, 1.59619140625, 1.76519775390625, 1.9342041015625, 2.10321044921875, 2.272216796875, 2.44122314453125, 2.6102294921875, 2.77923583984375, 2.9482421875, 3.11724853515625, 3.2862548828125, 3.45526123046875, 3.624267578125, 3.79327392578125, 3.9622802734375, 4.13128662109375, 4.30029296875, 4.46929931640625, 4.6383056640625, 4.80731201171875, 4.976318359375, 5.14532470703125, 5.3143310546875, 5.48333740234375, 5.65234375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 8.0, 4.0, 17.0, 14.0, 29.0, 22.0, 60.0, 68.0, 124.0, 150.0, 259.0, 430.0, 723.0, 1161.0, 2214.0, 4652.0, 9282.0, 19245.0, 39847.0, 85007.0, 197958.0, 350414.0, 182708.0, 80820.0, 37225.0, 17993.0, 8699.0, 4274.0, 2160.0, 1161.0, 638.0, 401.0, 253.0, 148.0, 127.0, 94.0, 61.0, 29.0, 18.0, 17.0, 15.0, 10.0, 2.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-3.40625, -3.304443359375, -3.20263671875, -3.100830078125, -2.9990234375, -2.897216796875, -2.79541015625, -2.693603515625, -2.591796875, -2.489990234375, -2.38818359375, -2.286376953125, -2.1845703125, -2.082763671875, -1.98095703125, -1.879150390625, -1.77734375, -1.675537109375, -1.57373046875, -1.471923828125, -1.3701171875, -1.268310546875, -1.16650390625, -1.064697265625, -0.962890625, -0.861083984375, -0.75927734375, -0.657470703125, -0.5556640625, -0.453857421875, -0.35205078125, -0.250244140625, -0.1484375, -0.046630859375, 0.05517578125, 0.156982421875, 0.2587890625, 0.360595703125, 0.46240234375, 0.564208984375, 0.666015625, 0.767822265625, 0.86962890625, 0.971435546875, 1.0732421875, 1.175048828125, 1.27685546875, 1.378662109375, 1.48046875, 1.582275390625, 1.68408203125, 1.785888671875, 1.8876953125, 1.989501953125, 2.09130859375, 2.193115234375, 2.294921875, 2.396728515625, 2.49853515625, 2.600341796875, 2.7021484375, 2.803955078125, 2.90576171875, 3.007568359375, 3.109375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 2.0, 4.0, 9.0, 8.0, 10.0, 8.0, 16.0, 18.0, 23.0, 24.0, 25.0, 31.0, 38.0, 37.0, 49.0, 51.0, 66.0, 101.0, 354.0, 1598.0, 142.0, 69.0, 54.0, 44.0, 32.0, 40.0, 34.0, 29.0, 22.0, 22.0, 15.0, 11.0, 8.0, 12.0, 12.0, 11.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.96875, -20.35546875, -19.7421875, -19.12890625, -18.515625, -17.90234375, -17.2890625, -16.67578125, -16.0625, -15.44921875, -14.8359375, -14.22265625, -13.609375, -12.99609375, -12.3828125, -11.76953125, -11.15625, -10.54296875, -9.9296875, -9.31640625, -8.703125, -8.08984375, -7.4765625, -6.86328125, -6.25, -5.63671875, -5.0234375, -4.41015625, -3.796875, -3.18359375, -2.5703125, -1.95703125, -1.34375, -0.73046875, -0.1171875, 0.49609375, 1.109375, 1.72265625, 2.3359375, 2.94921875, 3.5625, 4.17578125, 4.7890625, 5.40234375, 6.015625, 6.62890625, 7.2421875, 7.85546875, 8.46875, 9.08203125, 9.6953125, 10.30859375, 10.921875, 11.53515625, 12.1484375, 12.76171875, 13.375, 13.98828125, 14.6015625, 15.21484375, 15.828125, 16.44140625, 17.0546875, 17.66796875, 18.28125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 10.0, 11.0, 15.0, 12.0, 14.0, 17.0, 17.0, 37.0, 41.0, 67.0, 83.0, 125.0, 148.0, 212.0, 343.0, 922.0, 6851.0, 2998578.0, 134317.0, 2278.0, 538.0, 320.0, 206.0, 124.0, 95.0, 66.0, 60.0, 53.0, 30.0, 18.0, 25.0, 11.0, 14.0, 9.0, 11.0, 6.0, 6.0, 6.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.25, -39.865234375, -38.48046875, -37.095703125, -35.7109375, -34.326171875, -32.94140625, -31.556640625, -30.171875, -28.787109375, -27.40234375, -26.017578125, -24.6328125, -23.248046875, -21.86328125, -20.478515625, -19.09375, -17.708984375, -16.32421875, -14.939453125, -13.5546875, -12.169921875, -10.78515625, -9.400390625, -8.015625, -6.630859375, -5.24609375, -3.861328125, -2.4765625, -1.091796875, 0.29296875, 1.677734375, 3.0625, 4.447265625, 5.83203125, 7.216796875, 8.6015625, 9.986328125, 11.37109375, 12.755859375, 14.140625, 15.525390625, 16.91015625, 18.294921875, 19.6796875, 21.064453125, 22.44921875, 23.833984375, 25.21875, 26.603515625, 27.98828125, 29.373046875, 30.7578125, 32.142578125, 33.52734375, 34.912109375, 36.296875, 37.681640625, 39.06640625, 40.451171875, 41.8359375, 43.220703125, 44.60546875, 45.990234375, 47.375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 3.0, 8.0, 15.0, 24.0, 31.0, 40.0, 65.0, 98.0, 115.0, 121.0, 111.0, 103.0, 85.0, 70.0, 43.0, 29.0, 12.0, 14.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.285987854003906, -13.757482528686523, -13.22897720336914, -12.700471878051758, -12.171966552734375, -11.643461227416992, -11.114956855773926, -10.586451530456543, -10.05794620513916, -9.529440879821777, -9.000935554504395, -8.472430229187012, -7.943925380706787, -7.415420055389404, -6.88691520690918, -6.358409881591797, -5.829904556274414, -5.301399230957031, -4.772893905639648, -4.244389057159424, -3.715883731842041, -3.187378406524658, -2.6588733196258545, -2.130368232727051, -1.601862907409668, -1.0733577013015747, -0.5448524951934814, -0.016347289085388184, 0.5121579170227051, 1.040663242340088, 1.5691683292388916, 2.0976734161376953, 2.6261768341064453, 3.154682159423828, 3.683187246322632, 4.2116923332214355, 4.740197658538818, 5.268702983856201, 5.797207832336426, 6.325713157653809, 6.854218482971191, 7.382723808288574, 7.911229133605957, 8.43973445892334, 8.968238830566406, 9.496744155883789, 10.025249481201172, 10.553754806518555, 11.082260131835938, 11.61076545715332, 12.139270782470703, 12.667776107788086, 13.196281433105469, 13.724786758422852, 14.253291130065918, 14.7817964553833, 15.310301780700684, 15.838807106018066, 16.367311477661133, 16.895816802978516, 17.4243221282959, 17.95282745361328, 18.481332778930664, 19.009838104248047, 19.53834342956543]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 13.0, 16.0, 21.0, 16.0, 28.0, 27.0, 34.0, 36.0, 36.0, 39.0, 52.0, 50.0, 33.0, 47.0, 47.0, 51.0, 42.0, 48.0, 56.0, 42.0, 42.0, 36.0, 37.0, 22.0, 18.0, 28.0, 23.0, 7.0, 12.0, 8.0, 4.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.11354064941406, -41.5509033203125, -39.98826599121094, -38.425628662109375, -36.86299133300781, -35.30035400390625, -33.73771667480469, -32.175079345703125, -30.612443923950195, -29.049806594848633, -27.48716926574707, -25.92453384399414, -24.361896514892578, -22.799259185791016, -21.236621856689453, -19.67398452758789, -18.111347198486328, -16.548709869384766, -14.986072540283203, -13.423436164855957, -11.860798835754395, -10.298161506652832, -8.735525131225586, -7.172887802124023, -5.610250473022461, -4.047613143920898, -2.484976291656494, -0.9223394393920898, 0.6402978897094727, 2.202935218811035, 3.7655715942382812, 5.328208923339844, 6.890850067138672, 8.453487396240234, 10.016124725341797, 11.578761100769043, 13.141398429870605, 14.704035758972168, 16.266672134399414, 17.829309463500977, 19.39194679260254, 20.9545841217041, 22.517221450805664, 24.079856872558594, 25.642494201660156, 27.20513153076172, 28.76776885986328, 30.330406188964844, 31.893043518066406, 33.45568084716797, 35.01831817626953, 36.580955505371094, 38.143592834472656, 39.70623016357422, 41.26886749267578, 42.831504821777344, 44.394142150878906, 45.95677947998047, 47.51941680908203, 49.082054138183594, 50.644691467285156, 52.20732879638672, 53.76996612548828, 55.332603454589844, 56.89523696899414]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 13.0, 16.0, 19.0, 25.0, 22.0, 30.0, 33.0, 39.0, 36.0, 38.0, 37.0, 38.0, 53.0, 44.0, 40.0, 49.0, 45.0, 45.0, 37.0, 50.0, 36.0, 39.0, 40.0, 24.0, 25.0, 20.0, 18.0, 15.0, 18.0, 10.0, 13.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.10015869140625, -4.9229736328125, -4.74578857421875, -4.568603515625, -4.39141845703125, -4.2142333984375, -4.03704833984375, -3.85986328125, -3.68267822265625, -3.5054931640625, -3.32830810546875, -3.151123046875, -2.97393798828125, -2.7967529296875, -2.61956787109375, -2.4423828125, -2.26519775390625, -2.0880126953125, -1.91082763671875, -1.733642578125, -1.55645751953125, -1.3792724609375, -1.20208740234375, -1.02490234375, -0.84771728515625, -0.6705322265625, -0.49334716796875, -0.316162109375, -0.13897705078125, 0.0382080078125, 0.21539306640625, 0.392578125, 0.56976318359375, 0.7469482421875, 0.92413330078125, 1.101318359375, 1.27850341796875, 1.4556884765625, 1.63287353515625, 1.81005859375, 1.98724365234375, 2.1644287109375, 2.34161376953125, 2.518798828125, 2.69598388671875, 2.8731689453125, 3.05035400390625, 3.2275390625, 3.40472412109375, 3.5819091796875, 3.75909423828125, 3.936279296875, 4.11346435546875, 4.2906494140625, 4.46783447265625, 4.64501953125, 4.82220458984375, 4.9993896484375, 5.17657470703125, 5.353759765625, 5.53094482421875, 5.7081298828125, 5.88531494140625, 6.0625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 9.0, 9.0, 19.0, 15.0, 18.0, 30.0, 20.0, 22.0, 35.0, 38.0, 36.0, 48.0, 102.0, 472.0, 4020.0, 104376.0, 3497289.0, 575300.0, 10971.0, 974.0, 139.0, 56.0, 45.0, 36.0, 37.0, 32.0, 30.0, 17.0, 19.0, 9.0, 14.0, 17.0, 12.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.46875, -18.765380859375, -18.06201171875, -17.358642578125, -16.6552734375, -15.951904296875, -15.24853515625, -14.545166015625, -13.841796875, -13.138427734375, -12.43505859375, -11.731689453125, -11.0283203125, -10.324951171875, -9.62158203125, -8.918212890625, -8.21484375, -7.511474609375, -6.80810546875, -6.104736328125, -5.4013671875, -4.697998046875, -3.99462890625, -3.291259765625, -2.587890625, -1.884521484375, -1.18115234375, -0.477783203125, 0.2255859375, 0.928955078125, 1.63232421875, 2.335693359375, 3.0390625, 3.742431640625, 4.44580078125, 5.149169921875, 5.8525390625, 6.555908203125, 7.25927734375, 7.962646484375, 8.666015625, 9.369384765625, 10.07275390625, 10.776123046875, 11.4794921875, 12.182861328125, 12.88623046875, 13.589599609375, 14.29296875, 14.996337890625, 15.69970703125, 16.403076171875, 17.1064453125, 17.809814453125, 18.51318359375, 19.216552734375, 19.919921875, 20.623291015625, 21.32666015625, 22.030029296875, 22.7333984375, 23.436767578125, 24.14013671875, 24.843505859375, 25.546875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 6.0, 5.0, 5.0, 13.0, 28.0, 32.0, 36.0, 59.0, 65.0, 88.0, 101.0, 118.0, 185.0, 232.0, 276.0, 334.0, 418.0, 407.0, 384.0, 276.0, 233.0, 173.0, 121.0, 111.0, 97.0, 69.0, 58.0, 36.0, 20.0, 16.0, 16.0, 15.0, 12.0, 3.0, 2.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.90625, -10.6041259765625, -10.302001953125, -9.9998779296875, -9.69775390625, -9.3956298828125, -9.093505859375, -8.7913818359375, -8.4892578125, -8.1871337890625, -7.885009765625, -7.5828857421875, -7.28076171875, -6.9786376953125, -6.676513671875, -6.3743896484375, -6.072265625, -5.7701416015625, -5.468017578125, -5.1658935546875, -4.86376953125, -4.5616455078125, -4.259521484375, -3.9573974609375, -3.6552734375, -3.3531494140625, -3.051025390625, -2.7489013671875, -2.44677734375, -2.1446533203125, -1.842529296875, -1.5404052734375, -1.23828125, -0.9361572265625, -0.634033203125, -0.3319091796875, -0.02978515625, 0.2723388671875, 0.574462890625, 0.8765869140625, 1.1787109375, 1.4808349609375, 1.782958984375, 2.0850830078125, 2.38720703125, 2.6893310546875, 2.991455078125, 3.2935791015625, 3.595703125, 3.8978271484375, 4.199951171875, 4.5020751953125, 4.80419921875, 5.1063232421875, 5.408447265625, 5.7105712890625, 6.0126953125, 6.3148193359375, 6.616943359375, 6.9190673828125, 7.22119140625, 7.5233154296875, 7.825439453125, 8.1275634765625, 8.4296875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 7.0, 12.0, 13.0, 19.0, 31.0, 40.0, 32.0, 44.0, 61.0, 85.0, 121.0, 167.0, 239.0, 366.0, 1059.0, 10728.0, 1523143.0, 2639264.0, 16213.0, 1192.0, 444.0, 256.0, 190.0, 133.0, 112.0, 69.0, 54.0, 34.0, 26.0, 20.0, 23.0, 15.0, 12.0, 12.0, 6.0, 7.0, 5.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.6875, -33.49365234375, -32.2998046875, -31.10595703125, -29.912109375, -28.71826171875, -27.5244140625, -26.33056640625, -25.13671875, -23.94287109375, -22.7490234375, -21.55517578125, -20.361328125, -19.16748046875, -17.9736328125, -16.77978515625, -15.5859375, -14.39208984375, -13.1982421875, -12.00439453125, -10.810546875, -9.61669921875, -8.4228515625, -7.22900390625, -6.03515625, -4.84130859375, -3.6474609375, -2.45361328125, -1.259765625, -0.06591796875, 1.1279296875, 2.32177734375, 3.515625, 4.70947265625, 5.9033203125, 7.09716796875, 8.291015625, 9.48486328125, 10.6787109375, 11.87255859375, 13.06640625, 14.26025390625, 15.4541015625, 16.64794921875, 17.841796875, 19.03564453125, 20.2294921875, 21.42333984375, 22.6171875, 23.81103515625, 25.0048828125, 26.19873046875, 27.392578125, 28.58642578125, 29.7802734375, 30.97412109375, 32.16796875, 33.36181640625, 34.5556640625, 35.74951171875, 36.943359375, 38.13720703125, 39.3310546875, 40.52490234375, 41.71875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 136.0, 400.0, 387.0, 84.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.9327507019043, -54.79733657836914, -48.66192626953125, -42.526512145996094, -36.39109802246094, -30.255687713623047, -24.12027359008789, -17.98486328125, -11.849449157714844, -5.714036464691162, 0.42137622833251953, 6.556789398193359, 12.692201614379883, 18.827613830566406, 24.963027954101562, 31.098438262939453, 37.23385238647461, 43.369266510009766, 49.504676818847656, 55.64009094238281, 61.77550506591797, 67.91091918945312, 74.04632568359375, 80.1817398071289, 86.31715393066406, 92.45256805419922, 98.58798217773438, 104.723388671875, 110.85880279541016, 116.99421691894531, 123.12963104248047, 129.26504516601562, 135.4004669189453, 141.53587341308594, 147.67129516601562, 153.80670166015625, 159.94212341308594, 166.07752990722656, 172.21295166015625, 178.34835815429688, 184.4837646484375, 190.61917114257812, 196.7545928955078, 202.88999938964844, 209.02542114257812, 215.16082763671875, 221.29623413085938, 227.43165588378906, 233.56707763671875, 239.70248413085938, 245.83790588378906, 251.9733123779297, 258.1087341308594, 264.244140625, 270.3795471191406, 276.51495361328125, 282.6503601074219, 288.7857666015625, 294.9211730957031, 301.0566101074219, 307.1920166015625, 313.3274230957031, 319.46282958984375, 325.5982360839844, 331.7336730957031]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 2.0, 8.0, 7.0, 8.0, 13.0, 9.0, 12.0, 19.0, 27.0, 22.0, 22.0, 29.0, 33.0, 27.0, 29.0, 32.0, 45.0, 45.0, 45.0, 50.0, 50.0, 43.0, 34.0, 40.0, 39.0, 31.0, 39.0, 35.0, 21.0, 19.0, 23.0, 24.0, 18.0, 15.0, 17.0, 15.0, 13.0, 11.0, 7.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-35.31499481201172, -34.24851608276367, -33.18203353881836, -32.11555480957031, -31.049074172973633, -29.982593536376953, -28.916114807128906, -27.849634170532227, -26.783153533935547, -25.716672897338867, -24.65019416809082, -23.58371353149414, -22.51723289489746, -21.45075225830078, -20.384273529052734, -19.317792892456055, -18.251314163208008, -17.184833526611328, -16.11835479736328, -15.051874160766602, -13.985393524169922, -12.918913841247559, -11.852434158325195, -10.785953521728516, -9.719473838806152, -8.652994155883789, -7.586513519287109, -6.520033836364746, -5.453553676605225, -4.387073516845703, -3.32059383392334, -2.2541136741638184, -1.1876335144042969, -0.12115347385406494, 0.945326566696167, 2.0118064880371094, 3.078286647796631, 4.144766807556152, 5.211246490478516, 6.277726650238037, 7.344206809997559, 8.410686492919922, 9.477167129516602, 10.543646812438965, 11.610126495361328, 12.676607131958008, 13.743086814880371, 14.809566497802734, 15.876047134399414, 16.942527770996094, 18.00900650024414, 19.07548713684082, 20.1419677734375, 21.208446502685547, 22.274927139282227, 23.341407775878906, 24.407886505126953, 25.474367141723633, 26.54084587097168, 27.60732650756836, 28.67380714416504, 29.74028778076172, 30.806766510009766, 31.873247146606445, 32.939727783203125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 4.0, 11.0, 10.0, 18.0, 25.0, 17.0, 20.0, 30.0, 36.0, 31.0, 47.0, 30.0, 35.0, 52.0, 51.0, 48.0, 40.0, 46.0, 38.0, 42.0, 44.0, 53.0, 35.0, 28.0, 28.0, 36.0, 30.0, 24.0, 20.0, 18.0, 12.0, 14.0, 9.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.69134521484375, -5.5115966796875, -5.33184814453125, -5.152099609375, -4.97235107421875, -4.7926025390625, -4.61285400390625, -4.43310546875, -4.25335693359375, -4.0736083984375, -3.89385986328125, -3.714111328125, -3.53436279296875, -3.3546142578125, -3.17486572265625, -2.9951171875, -2.81536865234375, -2.6356201171875, -2.45587158203125, -2.276123046875, -2.09637451171875, -1.9166259765625, -1.73687744140625, -1.55712890625, -1.37738037109375, -1.1976318359375, -1.01788330078125, -0.838134765625, -0.65838623046875, -0.4786376953125, -0.29888916015625, -0.119140625, 0.06060791015625, 0.2403564453125, 0.42010498046875, 0.599853515625, 0.77960205078125, 0.9593505859375, 1.13909912109375, 1.31884765625, 1.49859619140625, 1.6783447265625, 1.85809326171875, 2.037841796875, 2.21759033203125, 2.3973388671875, 2.57708740234375, 2.7568359375, 2.93658447265625, 3.1163330078125, 3.29608154296875, 3.475830078125, 3.65557861328125, 3.8353271484375, 4.01507568359375, 4.19482421875, 4.37457275390625, 4.5543212890625, 4.73406982421875, 4.913818359375, 5.09356689453125, 5.2733154296875, 5.45306396484375, 5.6328125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 9.0, 15.0, 20.0, 23.0, 23.0, 52.0, 72.0, 111.0, 153.0, 238.0, 294.0, 480.0, 648.0, 986.0, 1384.0, 2024.0, 2940.0, 4248.0, 6210.0, 8900.0, 12948.0, 19150.0, 28483.0, 43178.0, 68363.0, 109443.0, 166293.0, 186960.0, 136546.0, 86206.0, 53897.0, 34797.0, 23162.0, 15783.0, 10860.0, 7272.0, 5048.0, 3519.0, 2399.0, 1699.0, 1132.0, 802.0, 553.0, 382.0, 269.0, 192.0, 126.0, 92.0, 48.0, 38.0, 33.0, 29.0, 10.0, 9.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.57666015625, -0.5582046508789062, -0.5397491455078125, -0.5212936401367188, -0.502838134765625, -0.48438262939453125, -0.4659271240234375, -0.44747161865234375, -0.42901611328125, -0.41056060791015625, -0.3921051025390625, -0.37364959716796875, -0.355194091796875, -0.33673858642578125, -0.3182830810546875, -0.29982757568359375, -0.2813720703125, -0.26291656494140625, -0.2444610595703125, -0.22600555419921875, -0.207550048828125, -0.18909454345703125, -0.1706390380859375, -0.15218353271484375, -0.13372802734375, -0.11527252197265625, -0.0968170166015625, -0.07836151123046875, -0.059906005859375, -0.04145050048828125, -0.0229949951171875, -0.00453948974609375, 0.013916015625, 0.03237152099609375, 0.0508270263671875, 0.06928253173828125, 0.087738037109375, 0.10619354248046875, 0.1246490478515625, 0.14310455322265625, 0.16156005859375, 0.18001556396484375, 0.1984710693359375, 0.21692657470703125, 0.235382080078125, 0.25383758544921875, 0.2722930908203125, 0.29074859619140625, 0.3092041015625, 0.32765960693359375, 0.3461151123046875, 0.36457061767578125, 0.383026123046875, 0.40148162841796875, 0.4199371337890625, 0.43839263916015625, 0.45684814453125, 0.47530364990234375, 0.4937591552734375, 0.5122146606445312, 0.530670166015625, 0.5491256713867188, 0.5675811767578125, 0.5860366821289062, 0.6044921875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 11.0, 9.0, 8.0, 11.0, 15.0, 23.0, 14.0, 19.0, 20.0, 29.0, 19.0, 27.0, 32.0, 49.0, 24.0, 38.0, 45.0, 47.0, 1066.0, 50.0, 43.0, 49.0, 45.0, 39.0, 30.0, 33.0, 29.0, 29.0, 23.0, 30.0, 19.0, 19.0, 8.0, 8.0, 13.0, 8.0, 12.0, 6.0, 8.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.08984375, -2.986602783203125, -2.88336181640625, -2.780120849609375, -2.6768798828125, -2.573638916015625, -2.47039794921875, -2.367156982421875, -2.263916015625, -2.160675048828125, -2.05743408203125, -1.954193115234375, -1.8509521484375, -1.747711181640625, -1.64447021484375, -1.541229248046875, -1.43798828125, -1.334747314453125, -1.23150634765625, -1.128265380859375, -1.0250244140625, -0.921783447265625, -0.81854248046875, -0.715301513671875, -0.612060546875, -0.508819580078125, -0.40557861328125, -0.302337646484375, -0.1990966796875, -0.095855712890625, 0.00738525390625, 0.110626220703125, 0.2138671875, 0.317108154296875, 0.42034912109375, 0.523590087890625, 0.6268310546875, 0.730072021484375, 0.83331298828125, 0.936553955078125, 1.039794921875, 1.143035888671875, 1.24627685546875, 1.349517822265625, 1.4527587890625, 1.555999755859375, 1.65924072265625, 1.762481689453125, 1.86572265625, 1.968963623046875, 2.07220458984375, 2.175445556640625, 2.2786865234375, 2.381927490234375, 2.48516845703125, 2.588409423828125, 2.691650390625, 2.794891357421875, 2.89813232421875, 3.001373291015625, 3.1046142578125, 3.207855224609375, 3.31109619140625, 3.414337158203125, 3.517578125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 7.0, 10.0, 24.0, 28.0, 42.0, 68.0, 102.0, 140.0, 208.0, 330.0, 495.0, 800.0, 1201.0, 1952.0, 3057.0, 4865.0, 7992.0, 12920.0, 21750.0, 38247.0, 68320.0, 126175.0, 213037.0, 1271163.0, 142384.0, 77031.0, 42312.0, 24680.0, 14365.0, 8763.0, 5327.0, 3283.0, 2164.0, 1379.0, 870.0, 562.0, 362.0, 250.0, 160.0, 91.0, 80.0, 36.0, 29.0, 16.0, 13.0, 11.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5576171875, -0.5402450561523438, -0.5228729248046875, -0.5055007934570312, -0.488128662109375, -0.47075653076171875, -0.4533843994140625, -0.43601226806640625, -0.41864013671875, -0.40126800537109375, -0.3838958740234375, -0.36652374267578125, -0.349151611328125, -0.33177947998046875, -0.3144073486328125, -0.29703521728515625, -0.2796630859375, -0.26229095458984375, -0.2449188232421875, -0.22754669189453125, -0.210174560546875, -0.19280242919921875, -0.1754302978515625, -0.15805816650390625, -0.14068603515625, -0.12331390380859375, -0.1059417724609375, -0.08856964111328125, -0.071197509765625, -0.05382537841796875, -0.0364532470703125, -0.01908111572265625, -0.001708984375, 0.01566314697265625, 0.0330352783203125, 0.05040740966796875, 0.067779541015625, 0.08515167236328125, 0.1025238037109375, 0.11989593505859375, 0.13726806640625, 0.15464019775390625, 0.1720123291015625, 0.18938446044921875, 0.206756591796875, 0.22412872314453125, 0.2415008544921875, 0.25887298583984375, 0.2762451171875, 0.29361724853515625, 0.3109893798828125, 0.32836151123046875, 0.345733642578125, 0.36310577392578125, 0.3804779052734375, 0.39785003662109375, 0.41522216796875, 0.43259429931640625, 0.4499664306640625, 0.46733856201171875, 0.484710693359375, 0.5020828247070312, 0.5194549560546875, 0.5368270874023438, 0.55419921875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 0.0, 4.0, 3.0, 2.0, 1.0, 10.0, 10.0, 8.0, 14.0, 23.0, 26.0, 38.0, 46.0, 45.0, 63.0, 54.0, 57.0, 83.0, 80.0, 65.0, 75.0, 68.0, 53.0, 37.0, 24.0, 23.0, 18.0, 13.0, 9.0, 13.0, 10.0, 9.0, 3.0, 3.0, 2.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001983642578125, -0.0019269287586212158, -0.0018702149391174316, -0.0018135011196136475, -0.0017567873001098633, -0.001700073480606079, -0.001643359661102295, -0.0015866458415985107, -0.0015299320220947266, -0.0014732182025909424, -0.0014165043830871582, -0.001359790563583374, -0.0013030767440795898, -0.0012463629245758057, -0.0011896491050720215, -0.0011329352855682373, -0.0010762214660644531, -0.001019507646560669, -0.0009627938270568848, -0.0009060800075531006, -0.0008493661880493164, -0.0007926523685455322, -0.000735938549041748, -0.0006792247295379639, -0.0006225109100341797, -0.0005657970905303955, -0.0005090832710266113, -0.00045236945152282715, -0.00039565563201904297, -0.0003389418125152588, -0.0002822279930114746, -0.00022551417350769043, -0.00016880035400390625, -0.00011208653450012207, -5.537271499633789e-05, 1.341104507446289e-06, 5.805492401123047e-05, 0.00011476874351501465, 0.00017148256301879883, 0.000228196382522583, 0.0002849102020263672, 0.00034162402153015137, 0.00039833784103393555, 0.0004550516605377197, 0.0005117654800415039, 0.0005684792995452881, 0.0006251931190490723, 0.0006819069385528564, 0.0007386207580566406, 0.0007953345775604248, 0.000852048397064209, 0.0009087622165679932, 0.0009654760360717773, 0.0010221898555755615, 0.0010789036750793457, 0.0011356174945831299, 0.001192331314086914, 0.0012490451335906982, 0.0013057589530944824, 0.0013624727725982666, 0.0014191865921020508, 0.001475900411605835, 0.0015326142311096191, 0.0015893280506134033, 0.0016460418701171875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 6.0, 13.0, 15.0, 6.0, 18.0, 17.0, 29.0, 32.0, 52.0, 72.0, 90.0, 161.0, 239.0, 447.0, 1373.0, 48974.0, 986823.0, 8276.0, 842.0, 370.0, 220.0, 137.0, 100.0, 59.0, 49.0, 30.0, 31.0, 15.0, 10.0, 13.0, 8.0, 4.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.036773681640625, -0.03563642501831055, -0.034499168395996094, -0.03336191177368164, -0.03222465515136719, -0.031087398529052734, -0.02995014190673828, -0.028812885284423828, -0.027675628662109375, -0.026538372039794922, -0.02540111541748047, -0.024263858795166016, -0.023126602172851562, -0.02198934555053711, -0.020852088928222656, -0.019714832305908203, -0.01857757568359375, -0.017440319061279297, -0.016303062438964844, -0.01516580581665039, -0.014028549194335938, -0.012891292572021484, -0.011754035949707031, -0.010616779327392578, -0.009479522705078125, -0.008342266082763672, -0.007205009460449219, -0.006067752838134766, -0.0049304962158203125, -0.0037932395935058594, -0.0026559829711914062, -0.0015187263488769531, -0.0003814697265625, 0.0007557868957519531, 0.0018930435180664062, 0.0030303001403808594, 0.0041675567626953125, 0.005304813385009766, 0.006442070007324219, 0.007579326629638672, 0.008716583251953125, 0.009853839874267578, 0.010991096496582031, 0.012128353118896484, 0.013265609741210938, 0.01440286636352539, 0.015540122985839844, 0.016677379608154297, 0.01781463623046875, 0.018951892852783203, 0.020089149475097656, 0.02122640609741211, 0.022363662719726562, 0.023500919342041016, 0.02463817596435547, 0.025775432586669922, 0.026912689208984375, 0.028049945831298828, 0.02918720245361328, 0.030324459075927734, 0.03146171569824219, 0.03259897232055664, 0.033736228942871094, 0.03487348556518555, 0.0360107421875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 461.0, 539.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02173800580203533, -0.021312225610017776, -0.02088644541800022, -0.020460665225982666, -0.02003488503396511, -0.019609104841947556, -0.01918332278728485, -0.018757542595267296, -0.01833176240324974, -0.017905982211232185, -0.01748020201921463, -0.017054421827197075, -0.01662864163517952, -0.016202859580516815, -0.01577708125114441, -0.01535130012780428, -0.014925519935786724, -0.014499739743769169, -0.014073959551751614, -0.013648178428411484, -0.013222398236393929, -0.012796618044376373, -0.012370837852358818, -0.011945057660341263, -0.011519277468323708, -0.011093497276306152, -0.010667717084288597, -0.010241936892271042, -0.009816155768930912, -0.009390375576913357, -0.008964595384895802, -0.008538815192878246, -0.008113034069538116, -0.007687253877520561, -0.007261473219841719, -0.0068356930278241634, -0.006409912370145321, -0.005984132178127766, -0.00555835198611021, -0.005132571794092655, -0.004706791136413813, -0.004281010944396257, -0.003855230286717415, -0.0034294500946998596, -0.0030036696698516607, -0.002577889245003462, -0.0021521090529859066, -0.0017263286281377077, -0.0013005482032895088, -0.0008747678366489708, -0.00044898747000843287, -2.32071615755558e-05, 0.0004025732632726431, 0.000828353688120842, 0.0012541338801383972, 0.001679914304986596, 0.002105694729834795, 0.002531475154682994, 0.0029572555795311928, 0.003383035771548748, 0.003808816196396947, 0.004234596621245146, 0.004660376813262701, 0.005086157470941544, 0.005511937662959099]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 4.0, 10.0, 10.0, 10.0, 14.0, 22.0, 33.0, 31.0, 36.0, 35.0, 48.0, 49.0, 62.0, 61.0, 48.0, 68.0, 53.0, 54.0, 51.0, 62.0, 44.0, 45.0, 35.0, 25.0, 19.0, 19.0, 18.0, 10.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000890195369720459, -0.0008535804226994514, -0.0008169654756784439, -0.0007803505286574364, -0.0007437355816364288, -0.0007071206346154213, -0.0006705056875944138, -0.0006338907405734062, -0.0005972757935523987, -0.0005606608465313911, -0.0005240458995103836, -0.00048743095248937607, -0.00045081600546836853, -0.000414201058447361, -0.00037758611142635345, -0.0003409711644053459, -0.0003043562173843384, -0.00026774127036333084, -0.0002311263233423233, -0.00019451137632131577, -0.00015789642930030823, -0.00012128148227930069, -8.466653525829315e-05, -4.8051588237285614e-05, -1.1436641216278076e-05, 2.517830580472946e-05, 6.1793252825737e-05, 9.840819984674454e-05, 0.00013502314686775208, 0.0001716380938887596, 0.00020825304090976715, 0.0002448679879307747, 0.0002814829349517822, 0.00031809788197278976, 0.0003547128289937973, 0.00039132777601480484, 0.0004279427230358124, 0.0004645576700568199, 0.0005011726170778275, 0.000537787564098835, 0.0005744025111198425, 0.0006110174581408501, 0.0006476324051618576, 0.0006842473521828651, 0.0007208622992038727, 0.0007574772462248802, 0.0007940921932458878, 0.0008307071402668953, 0.0008673220872879028, 0.0009039370343089104, 0.0009405519813299179, 0.0009771669283509254, 0.001013781875371933, 0.0010503968223929405, 0.001087011769413948, 0.0011236267164349556, 0.0011602416634559631, 0.0011968566104769707, 0.0012334715574979782, 0.0012700865045189857, 0.0013067014515399933, 0.0013433163985610008, 0.0013799313455820084, 0.001416546292603016, 0.0014531612396240234]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 4.0, 11.0, 10.0, 18.0, 25.0, 17.0, 20.0, 30.0, 36.0, 31.0, 47.0, 30.0, 35.0, 52.0, 51.0, 48.0, 40.0, 46.0, 38.0, 42.0, 44.0, 53.0, 35.0, 28.0, 28.0, 36.0, 30.0, 24.0, 20.0, 18.0, 12.0, 14.0, 9.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.69134521484375, -5.5115966796875, -5.33184814453125, -5.152099609375, -4.97235107421875, -4.7926025390625, -4.61285400390625, -4.43310546875, -4.25335693359375, -4.0736083984375, -3.89385986328125, -3.714111328125, -3.53436279296875, -3.3546142578125, -3.17486572265625, -2.9951171875, -2.81536865234375, -2.6356201171875, -2.45587158203125, -2.276123046875, -2.09637451171875, -1.9166259765625, -1.73687744140625, -1.55712890625, -1.37738037109375, -1.1976318359375, -1.01788330078125, -0.838134765625, -0.65838623046875, -0.4786376953125, -0.29888916015625, -0.119140625, 0.06060791015625, 0.2403564453125, 0.42010498046875, 0.599853515625, 0.77960205078125, 0.9593505859375, 1.13909912109375, 1.31884765625, 1.49859619140625, 1.6783447265625, 1.85809326171875, 2.037841796875, 2.21759033203125, 2.3973388671875, 2.57708740234375, 2.7568359375, 2.93658447265625, 3.1163330078125, 3.29608154296875, 3.475830078125, 3.65557861328125, 3.8353271484375, 4.01507568359375, 4.19482421875, 4.37457275390625, 4.5543212890625, 4.73406982421875, 4.913818359375, 5.09356689453125, 5.2733154296875, 5.45306396484375, 5.6328125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 9.0, 12.0, 16.0, 21.0, 32.0, 41.0, 71.0, 90.0, 124.0, 179.0, 326.0, 624.0, 1071.0, 1961.0, 4085.0, 8629.0, 18704.0, 42999.0, 98098.0, 236251.0, 372985.0, 145431.0, 64077.0, 28148.0, 12520.0, 5856.0, 2826.0, 1405.0, 717.0, 444.0, 276.0, 143.0, 111.0, 74.0, 48.0, 39.0, 32.0, 23.0, 16.0, 17.0, 11.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.359375, -3.248291015625, -3.13720703125, -3.026123046875, -2.9150390625, -2.803955078125, -2.69287109375, -2.581787109375, -2.470703125, -2.359619140625, -2.24853515625, -2.137451171875, -2.0263671875, -1.915283203125, -1.80419921875, -1.693115234375, -1.58203125, -1.470947265625, -1.35986328125, -1.248779296875, -1.1376953125, -1.026611328125, -0.91552734375, -0.804443359375, -0.693359375, -0.582275390625, -0.47119140625, -0.360107421875, -0.2490234375, -0.137939453125, -0.02685546875, 0.084228515625, 0.1953125, 0.306396484375, 0.41748046875, 0.528564453125, 0.6396484375, 0.750732421875, 0.86181640625, 0.972900390625, 1.083984375, 1.195068359375, 1.30615234375, 1.417236328125, 1.5283203125, 1.639404296875, 1.75048828125, 1.861572265625, 1.97265625, 2.083740234375, 2.19482421875, 2.305908203125, 2.4169921875, 2.528076171875, 2.63916015625, 2.750244140625, 2.861328125, 2.972412109375, 3.08349609375, 3.194580078125, 3.3056640625, 3.416748046875, 3.52783203125, 3.638916015625, 3.75]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 4.0, 3.0, 3.0, 7.0, 3.0, 12.0, 8.0, 8.0, 7.0, 12.0, 13.0, 22.0, 18.0, 20.0, 25.0, 29.0, 26.0, 31.0, 33.0, 41.0, 39.0, 51.0, 86.0, 213.0, 1619.0, 215.0, 85.0, 55.0, 39.0, 44.0, 40.0, 43.0, 32.0, 31.0, 22.0, 19.0, 20.0, 11.0, 11.0, 14.0, 13.0, 4.0, 8.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-19.34375, -18.82763671875, -18.3115234375, -17.79541015625, -17.279296875, -16.76318359375, -16.2470703125, -15.73095703125, -15.21484375, -14.69873046875, -14.1826171875, -13.66650390625, -13.150390625, -12.63427734375, -12.1181640625, -11.60205078125, -11.0859375, -10.56982421875, -10.0537109375, -9.53759765625, -9.021484375, -8.50537109375, -7.9892578125, -7.47314453125, -6.95703125, -6.44091796875, -5.9248046875, -5.40869140625, -4.892578125, -4.37646484375, -3.8603515625, -3.34423828125, -2.828125, -2.31201171875, -1.7958984375, -1.27978515625, -0.763671875, -0.24755859375, 0.2685546875, 0.78466796875, 1.30078125, 1.81689453125, 2.3330078125, 2.84912109375, 3.365234375, 3.88134765625, 4.3974609375, 4.91357421875, 5.4296875, 5.94580078125, 6.4619140625, 6.97802734375, 7.494140625, 8.01025390625, 8.5263671875, 9.04248046875, 9.55859375, 10.07470703125, 10.5908203125, 11.10693359375, 11.623046875, 12.13916015625, 12.6552734375, 13.17138671875, 13.6875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 5.0, 7.0, 6.0, 9.0, 15.0, 11.0, 25.0, 24.0, 24.0, 44.0, 43.0, 75.0, 99.0, 122.0, 174.0, 214.0, 283.0, 591.0, 2575.0, 341800.0, 2792408.0, 5004.0, 764.0, 343.0, 249.0, 171.0, 121.0, 102.0, 80.0, 57.0, 51.0, 31.0, 37.0, 30.0, 20.0, 10.0, 21.0, 15.0, 9.0, 6.0, 5.0, 5.0, 5.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-33.875, -32.7119140625, -31.548828125, -30.3857421875, -29.22265625, -28.0595703125, -26.896484375, -25.7333984375, -24.5703125, -23.4072265625, -22.244140625, -21.0810546875, -19.91796875, -18.7548828125, -17.591796875, -16.4287109375, -15.265625, -14.1025390625, -12.939453125, -11.7763671875, -10.61328125, -9.4501953125, -8.287109375, -7.1240234375, -5.9609375, -4.7978515625, -3.634765625, -2.4716796875, -1.30859375, -0.1455078125, 1.017578125, 2.1806640625, 3.34375, 4.5068359375, 5.669921875, 6.8330078125, 7.99609375, 9.1591796875, 10.322265625, 11.4853515625, 12.6484375, 13.8115234375, 14.974609375, 16.1376953125, 17.30078125, 18.4638671875, 19.626953125, 20.7900390625, 21.953125, 23.1162109375, 24.279296875, 25.4423828125, 26.60546875, 27.7685546875, 28.931640625, 30.0947265625, 31.2578125, 32.4208984375, 33.583984375, 34.7470703125, 35.91015625, 37.0732421875, 38.236328125, 39.3994140625, 40.5625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 11.0, 338.0, 623.0, 44.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.69039916992188, -188.60650634765625, -184.5226287841797, -180.43873596191406, -176.3548583984375, -172.27096557617188, -168.1870880126953, -164.1031951904297, -160.01931762695312, -155.9354248046875, -151.85154724121094, -147.7676544189453, -143.68377685546875, -139.59988403320312, -135.51600646972656, -131.43211364746094, -127.34822845458984, -123.26434326171875, -119.18045806884766, -115.09657287597656, -111.01268768310547, -106.92880249023438, -102.84490966796875, -98.76103210449219, -94.67713928222656, -90.59325408935547, -86.50936889648438, -82.42548370361328, -78.34159851074219, -74.2577133178711, -70.173828125, -66.08993530273438, -62.00605010986328, -57.92216491699219, -53.838279724121094, -49.75439453125, -45.670509338378906, -41.58662414550781, -37.50273513793945, -33.41884994506836, -29.334964752197266, -25.251079559326172, -21.167194366455078, -17.08330726623535, -12.999422073364258, -8.915536880493164, -4.8316497802734375, -0.7477645874023438, 3.33612060546875, 7.420006275177002, 11.503891944885254, 15.587778091430664, 19.671663284301758, 23.75554847717285, 27.839435577392578, 31.923320770263672, 36.007205963134766, 40.09109115600586, 44.17497634887695, 48.25886535644531, 52.342750549316406, 56.4266357421875, 60.510520935058594, 64.59440612792969, 68.67829132080078]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 13.0, 6.0, 8.0, 9.0, 14.0, 15.0, 21.0, 28.0, 28.0, 26.0, 35.0, 27.0, 39.0, 27.0, 36.0, 45.0, 35.0, 53.0, 53.0, 31.0, 51.0, 47.0, 36.0, 34.0, 38.0, 22.0, 23.0, 22.0, 28.0, 20.0, 23.0, 13.0, 13.0, 13.0, 14.0, 10.0, 5.0, 4.0, 4.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0], "bins": [-52.956687927246094, -51.42449188232422, -49.892295837402344, -48.36009979248047, -46.82790756225586, -45.295711517333984, -43.76351547241211, -42.231319427490234, -40.699127197265625, -39.16693115234375, -37.634735107421875, -36.1025390625, -34.57034683227539, -33.038150787353516, -31.50595474243164, -29.973758697509766, -28.44156265258789, -26.909366607666016, -25.377172470092773, -23.8449764251709, -22.312782287597656, -20.78058624267578, -19.248390197753906, -17.71619415283203, -16.18400001525879, -14.65180492401123, -13.119609832763672, -11.587413787841797, -10.055218696594238, -8.52302360534668, -6.990827560424805, -5.458632469177246, -3.926433563232422, -2.394238233566284, -0.8620429039001465, 0.6701526641845703, 2.202347755432129, 3.7345428466796875, 5.2667388916015625, 6.798933982849121, 8.33112907409668, 9.863324165344238, 11.395519256591797, 12.927715301513672, 14.45991039276123, 15.992105484008789, 17.524301528930664, 19.056495666503906, 20.58869171142578, 22.120887756347656, 23.6530818939209, 25.185277938842773, 26.717472076416016, 28.24966812133789, 29.781864166259766, 31.31406021118164, 32.84625244140625, 34.378448486328125, 35.91064453125, 37.442840576171875, 38.975032806396484, 40.50722885131836, 42.039424896240234, 43.57162094116211, 45.103816986083984]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 4.0, 1.0, 11.0, 5.0, 10.0, 13.0, 15.0, 22.0, 21.0, 27.0, 26.0, 37.0, 27.0, 37.0, 36.0, 43.0, 54.0, 46.0, 41.0, 41.0, 39.0, 35.0, 39.0, 42.0, 50.0, 36.0, 23.0, 30.0, 38.0, 27.0, 18.0, 25.0, 16.0, 16.0, 16.0, 12.0, 11.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90234375, -5.72216796875, -5.5419921875, -5.36181640625, -5.181640625, -5.00146484375, -4.8212890625, -4.64111328125, -4.4609375, -4.28076171875, -4.1005859375, -3.92041015625, -3.740234375, -3.56005859375, -3.3798828125, -3.19970703125, -3.01953125, -2.83935546875, -2.6591796875, -2.47900390625, -2.298828125, -2.11865234375, -1.9384765625, -1.75830078125, -1.578125, -1.39794921875, -1.2177734375, -1.03759765625, -0.857421875, -0.67724609375, -0.4970703125, -0.31689453125, -0.13671875, 0.04345703125, 0.2236328125, 0.40380859375, 0.583984375, 0.76416015625, 0.9443359375, 1.12451171875, 1.3046875, 1.48486328125, 1.6650390625, 1.84521484375, 2.025390625, 2.20556640625, 2.3857421875, 2.56591796875, 2.74609375, 2.92626953125, 3.1064453125, 3.28662109375, 3.466796875, 3.64697265625, 3.8271484375, 4.00732421875, 4.1875, 4.36767578125, 4.5478515625, 4.72802734375, 4.908203125, 5.08837890625, 5.2685546875, 5.44873046875, 5.62890625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 3.0, 9.0, 12.0, 12.0, 8.0, 19.0, 24.0, 21.0, 24.0, 28.0, 34.0, 47.0, 71.0, 107.0, 326.0, 1133.0, 7504.0, 179030.0, 3376288.0, 611000.0, 15817.0, 1806.0, 452.0, 166.0, 64.0, 44.0, 39.0, 28.0, 18.0, 27.0, 20.0, 21.0, 15.0, 22.0, 12.0, 6.0, 7.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.40625, -18.77294921875, -18.1396484375, -17.50634765625, -16.873046875, -16.23974609375, -15.6064453125, -14.97314453125, -14.33984375, -13.70654296875, -13.0732421875, -12.43994140625, -11.806640625, -11.17333984375, -10.5400390625, -9.90673828125, -9.2734375, -8.64013671875, -8.0068359375, -7.37353515625, -6.740234375, -6.10693359375, -5.4736328125, -4.84033203125, -4.20703125, -3.57373046875, -2.9404296875, -2.30712890625, -1.673828125, -1.04052734375, -0.4072265625, 0.22607421875, 0.859375, 1.49267578125, 2.1259765625, 2.75927734375, 3.392578125, 4.02587890625, 4.6591796875, 5.29248046875, 5.92578125, 6.55908203125, 7.1923828125, 7.82568359375, 8.458984375, 9.09228515625, 9.7255859375, 10.35888671875, 10.9921875, 11.62548828125, 12.2587890625, 12.89208984375, 13.525390625, 14.15869140625, 14.7919921875, 15.42529296875, 16.05859375, 16.69189453125, 17.3251953125, 17.95849609375, 18.591796875, 19.22509765625, 19.8583984375, 20.49169921875, 21.125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 7.0, 9.0, 19.0, 13.0, 21.0, 20.0, 29.0, 38.0, 64.0, 77.0, 84.0, 110.0, 173.0, 207.0, 249.0, 318.0, 399.0, 409.0, 371.0, 342.0, 302.0, 192.0, 136.0, 118.0, 89.0, 72.0, 44.0, 29.0, 26.0, 28.0, 17.0, 19.0, 7.0, 4.0, 4.0, 9.0, 8.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.765625, -8.45703125, -8.1484375, -7.83984375, -7.53125, -7.22265625, -6.9140625, -6.60546875, -6.296875, -5.98828125, -5.6796875, -5.37109375, -5.0625, -4.75390625, -4.4453125, -4.13671875, -3.828125, -3.51953125, -3.2109375, -2.90234375, -2.59375, -2.28515625, -1.9765625, -1.66796875, -1.359375, -1.05078125, -0.7421875, -0.43359375, -0.125, 0.18359375, 0.4921875, 0.80078125, 1.109375, 1.41796875, 1.7265625, 2.03515625, 2.34375, 2.65234375, 2.9609375, 3.26953125, 3.578125, 3.88671875, 4.1953125, 4.50390625, 4.8125, 5.12109375, 5.4296875, 5.73828125, 6.046875, 6.35546875, 6.6640625, 6.97265625, 7.28125, 7.58984375, 7.8984375, 8.20703125, 8.515625, 8.82421875, 9.1328125, 9.44140625, 9.75, 10.05859375, 10.3671875, 10.67578125, 10.984375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 3.0, 8.0, 11.0, 8.0, 11.0, 12.0, 20.0, 35.0, 41.0, 45.0, 68.0, 76.0, 106.0, 130.0, 160.0, 233.0, 285.0, 502.0, 1429.0, 37221.0, 3746124.0, 401274.0, 4369.0, 610.0, 374.0, 242.0, 179.0, 148.0, 118.0, 107.0, 59.0, 51.0, 49.0, 34.0, 26.0, 28.0, 19.0, 17.0, 10.0, 9.0, 9.0, 6.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-38.1875, -36.98388671875, -35.7802734375, -34.57666015625, -33.373046875, -32.16943359375, -30.9658203125, -29.76220703125, -28.55859375, -27.35498046875, -26.1513671875, -24.94775390625, -23.744140625, -22.54052734375, -21.3369140625, -20.13330078125, -18.9296875, -17.72607421875, -16.5224609375, -15.31884765625, -14.115234375, -12.91162109375, -11.7080078125, -10.50439453125, -9.30078125, -8.09716796875, -6.8935546875, -5.68994140625, -4.486328125, -3.28271484375, -2.0791015625, -0.87548828125, 0.328125, 1.53173828125, 2.7353515625, 3.93896484375, 5.142578125, 6.34619140625, 7.5498046875, 8.75341796875, 9.95703125, 11.16064453125, 12.3642578125, 13.56787109375, 14.771484375, 15.97509765625, 17.1787109375, 18.38232421875, 19.5859375, 20.78955078125, 21.9931640625, 23.19677734375, 24.400390625, 25.60400390625, 26.8076171875, 28.01123046875, 29.21484375, 30.41845703125, 31.6220703125, 32.82568359375, 34.029296875, 35.23291015625, 36.4365234375, 37.64013671875, 38.84375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 58.0, 220.0, 378.0, 259.0, 80.0, 12.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.08834075927734, -69.35191345214844, -64.61548614501953, -59.87905502319336, -55.14262771606445, -50.40620040893555, -45.669769287109375, -40.93334197998047, -36.19691467285156, -31.460487365722656, -26.724058151245117, -21.987628936767578, -17.251201629638672, -12.514774322509766, -7.778345108032227, -3.0419158935546875, 1.6945114135742188, 6.430939674377441, 11.167367935180664, 15.903796195983887, 20.64022445678711, 25.376651763916016, 30.113080978393555, 34.849510192871094, 39.5859375, 44.322364807128906, 49.05879211425781, 53.795223236083984, 58.53165054321289, 63.2680778503418, 68.00450897216797, 72.74093627929688, 77.47737121582031, 82.21379852294922, 86.95022583007812, 91.68665313720703, 96.42308044433594, 101.15951538085938, 105.89594268798828, 110.63236999511719, 115.3687973022461, 120.105224609375, 124.8416519165039, 129.5780792236328, 134.31451416015625, 139.05093383789062, 143.78736877441406, 148.5238037109375, 153.26022338867188, 157.9966583251953, 162.7330780029297, 167.46951293945312, 172.2059326171875, 176.94236755371094, 181.6787872314453, 186.41522216796875, 191.15164184570312, 195.88807678222656, 200.62449645996094, 205.36093139648438, 210.09735107421875, 214.8337860107422, 219.57020568847656, 224.306640625, 229.04307556152344]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 9.0, 6.0, 7.0, 6.0, 5.0, 13.0, 13.0, 18.0, 9.0, 22.0, 21.0, 16.0, 41.0, 28.0, 34.0, 20.0, 35.0, 31.0, 30.0, 32.0, 35.0, 30.0, 44.0, 33.0, 35.0, 35.0, 39.0, 36.0, 27.0, 37.0, 35.0, 25.0, 27.0, 31.0, 17.0, 10.0, 15.0, 19.0, 10.0, 11.0, 9.0, 13.0, 7.0, 5.0, 6.0, 1.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-31.401290893554688, -30.431167602539062, -29.461044311523438, -28.49091911315918, -27.520795822143555, -26.55067253112793, -25.580547332763672, -24.610424041748047, -23.640300750732422, -22.670177459716797, -21.700054168701172, -20.729928970336914, -19.75980567932129, -18.789682388305664, -17.819557189941406, -16.84943389892578, -15.879310607910156, -14.909187316894531, -13.93906307220459, -12.968938827514648, -11.998815536499023, -11.028692245483398, -10.058568000793457, -9.088443756103516, -8.11832046508789, -7.148196697235107, -6.178072929382324, -5.207949161529541, -4.237825393676758, -3.2677016258239746, -2.2975778579711914, -1.3274540901184082, -0.357330322265625, 0.6127934455871582, 1.5829172134399414, 2.5530409812927246, 3.523164749145508, 4.493288516998291, 5.463412284851074, 6.433536052703857, 7.403659820556641, 8.373783111572266, 9.343907356262207, 10.314031600952148, 11.284154891967773, 12.254278182983398, 13.22440242767334, 14.194526672363281, 15.164649963378906, 16.13477325439453, 17.104896545410156, 18.075021743774414, 19.04514503479004, 20.015268325805664, 20.985393524169922, 21.955516815185547, 22.925640106201172, 23.895763397216797, 24.865886688232422, 25.83601188659668, 26.806135177612305, 27.77625846862793, 28.746383666992188, 29.716506958007812, 30.686630249023438]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 3.0, 5.0, 8.0, 10.0, 20.0, 17.0, 21.0, 21.0, 16.0, 34.0, 31.0, 30.0, 31.0, 26.0, 45.0, 47.0, 19.0, 41.0, 33.0, 47.0, 37.0, 40.0, 41.0, 37.0, 48.0, 37.0, 24.0, 31.0, 33.0, 28.0, 21.0, 24.0, 14.0, 14.0, 14.0, 6.0, 14.0, 6.0, 4.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.6484375, -5.484619140625, -5.32080078125, -5.156982421875, -4.9931640625, -4.829345703125, -4.66552734375, -4.501708984375, -4.337890625, -4.174072265625, -4.01025390625, -3.846435546875, -3.6826171875, -3.518798828125, -3.35498046875, -3.191162109375, -3.02734375, -2.863525390625, -2.69970703125, -2.535888671875, -2.3720703125, -2.208251953125, -2.04443359375, -1.880615234375, -1.716796875, -1.552978515625, -1.38916015625, -1.225341796875, -1.0615234375, -0.897705078125, -0.73388671875, -0.570068359375, -0.40625, -0.242431640625, -0.07861328125, 0.085205078125, 0.2490234375, 0.412841796875, 0.57666015625, 0.740478515625, 0.904296875, 1.068115234375, 1.23193359375, 1.395751953125, 1.5595703125, 1.723388671875, 1.88720703125, 2.051025390625, 2.21484375, 2.378662109375, 2.54248046875, 2.706298828125, 2.8701171875, 3.033935546875, 3.19775390625, 3.361572265625, 3.525390625, 3.689208984375, 3.85302734375, 4.016845703125, 4.1806640625, 4.344482421875, 4.50830078125, 4.672119140625, 4.8359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 14.0, 13.0, 16.0, 28.0, 52.0, 77.0, 92.0, 140.0, 199.0, 250.0, 422.0, 546.0, 808.0, 1147.0, 1677.0, 2347.0, 3419.0, 5043.0, 7320.0, 10772.0, 15927.0, 24085.0, 36531.0, 56099.0, 88171.0, 140902.0, 190416.0, 163541.0, 104650.0, 65748.0, 42165.0, 27911.0, 18479.0, 12405.0, 8348.0, 5761.0, 4086.0, 2781.0, 1896.0, 1310.0, 873.0, 613.0, 402.0, 324.0, 239.0, 151.0, 132.0, 82.0, 56.0, 39.0, 19.0, 14.0, 11.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.58984375, -0.57061767578125, -0.5513916015625, -0.53216552734375, -0.512939453125, -0.49371337890625, -0.4744873046875, -0.45526123046875, -0.43603515625, -0.41680908203125, -0.3975830078125, -0.37835693359375, -0.359130859375, -0.33990478515625, -0.3206787109375, -0.30145263671875, -0.2822265625, -0.26300048828125, -0.2437744140625, -0.22454833984375, -0.205322265625, -0.18609619140625, -0.1668701171875, -0.14764404296875, -0.12841796875, -0.10919189453125, -0.0899658203125, -0.07073974609375, -0.051513671875, -0.03228759765625, -0.0130615234375, 0.00616455078125, 0.025390625, 0.04461669921875, 0.0638427734375, 0.08306884765625, 0.102294921875, 0.12152099609375, 0.1407470703125, 0.15997314453125, 0.17919921875, 0.19842529296875, 0.2176513671875, 0.23687744140625, 0.256103515625, 0.27532958984375, 0.2945556640625, 0.31378173828125, 0.3330078125, 0.35223388671875, 0.3714599609375, 0.39068603515625, 0.409912109375, 0.42913818359375, 0.4483642578125, 0.46759033203125, 0.48681640625, 0.50604248046875, 0.5252685546875, 0.54449462890625, 0.563720703125, 0.58294677734375, 0.6021728515625, 0.62139892578125, 0.640625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 2.0, 9.0, 6.0, 11.0, 12.0, 9.0, 8.0, 14.0, 19.0, 26.0, 25.0, 19.0, 22.0, 30.0, 35.0, 37.0, 26.0, 35.0, 30.0, 35.0, 42.0, 39.0, 1053.0, 31.0, 27.0, 37.0, 34.0, 34.0, 37.0, 31.0, 22.0, 22.0, 27.0, 17.0, 27.0, 20.0, 21.0, 12.0, 15.0, 10.0, 12.0, 5.0, 8.0, 8.0, 1.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.8046875, -2.712890625, -2.62109375, -2.529296875, -2.4375, -2.345703125, -2.25390625, -2.162109375, -2.0703125, -1.978515625, -1.88671875, -1.794921875, -1.703125, -1.611328125, -1.51953125, -1.427734375, -1.3359375, -1.244140625, -1.15234375, -1.060546875, -0.96875, -0.876953125, -0.78515625, -0.693359375, -0.6015625, -0.509765625, -0.41796875, -0.326171875, -0.234375, -0.142578125, -0.05078125, 0.041015625, 0.1328125, 0.224609375, 0.31640625, 0.408203125, 0.5, 0.591796875, 0.68359375, 0.775390625, 0.8671875, 0.958984375, 1.05078125, 1.142578125, 1.234375, 1.326171875, 1.41796875, 1.509765625, 1.6015625, 1.693359375, 1.78515625, 1.876953125, 1.96875, 2.060546875, 2.15234375, 2.244140625, 2.3359375, 2.427734375, 2.51953125, 2.611328125, 2.703125, 2.794921875, 2.88671875, 2.978515625, 3.0703125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 14.0, 18.0, 26.0, 38.0, 68.0, 84.0, 164.0, 285.0, 460.0, 729.0, 1334.0, 2289.0, 4040.0, 7042.0, 12588.0, 23941.0, 45058.0, 91186.0, 185327.0, 1320255.0, 197367.0, 98680.0, 49290.0, 25191.0, 13798.0, 7491.0, 4278.0, 2468.0, 1443.0, 886.0, 476.0, 314.0, 184.0, 109.0, 72.0, 43.0, 31.0, 12.0, 16.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.810546875, -0.7889633178710938, -0.7673797607421875, -0.7457962036132812, -0.724212646484375, -0.7026290893554688, -0.6810455322265625, -0.6594619750976562, -0.63787841796875, -0.6162948608398438, -0.5947113037109375, -0.5731277465820312, -0.551544189453125, -0.5299606323242188, -0.5083770751953125, -0.48679351806640625, -0.4652099609375, -0.44362640380859375, -0.4220428466796875, -0.40045928955078125, -0.378875732421875, -0.35729217529296875, -0.3357086181640625, -0.31412506103515625, -0.29254150390625, -0.27095794677734375, -0.2493743896484375, -0.22779083251953125, -0.206207275390625, -0.18462371826171875, -0.1630401611328125, -0.14145660400390625, -0.119873046875, -0.09828948974609375, -0.0767059326171875, -0.05512237548828125, -0.033538818359375, -0.01195526123046875, 0.0096282958984375, 0.03121185302734375, 0.05279541015625, 0.07437896728515625, 0.0959625244140625, 0.11754608154296875, 0.139129638671875, 0.16071319580078125, 0.1822967529296875, 0.20388031005859375, 0.2254638671875, 0.24704742431640625, 0.2686309814453125, 0.29021453857421875, 0.311798095703125, 0.33338165283203125, 0.3549652099609375, 0.37654876708984375, 0.39813232421875, 0.41971588134765625, 0.4412994384765625, 0.46288299560546875, 0.484466552734375, 0.5060501098632812, 0.5276336669921875, 0.5492172241210938, 0.57080078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 9.0, 10.0, 15.0, 10.0, 17.0, 22.0, 15.0, 30.0, 41.0, 33.0, 50.0, 43.0, 67.0, 61.0, 63.0, 68.0, 50.0, 56.0, 46.0, 57.0, 31.0, 29.0, 27.0, 24.0, 32.0, 18.0, 12.0, 17.0, 9.0, 6.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001987457275390625, -0.0019224882125854492, -0.0018575191497802734, -0.0017925500869750977, -0.0017275810241699219, -0.001662611961364746, -0.0015976428985595703, -0.0015326738357543945, -0.0014677047729492188, -0.001402735710144043, -0.0013377666473388672, -0.0012727975845336914, -0.0012078285217285156, -0.0011428594589233398, -0.001077890396118164, -0.0010129213333129883, -0.0009479522705078125, -0.0008829832077026367, -0.0008180141448974609, -0.0007530450820922852, -0.0006880760192871094, -0.0006231069564819336, -0.0005581378936767578, -0.000493168830871582, -0.00042819976806640625, -0.00036323070526123047, -0.0002982616424560547, -0.0002332925796508789, -0.00016832351684570312, -0.00010335445404052734, -3.838539123535156e-05, 2.658367156982422e-05, 9.1552734375e-05, 0.00015652179718017578, 0.00022149085998535156, 0.00028645992279052734, 0.0003514289855957031, 0.0004163980484008789, 0.0004813671112060547, 0.0005463361740112305, 0.0006113052368164062, 0.000676274299621582, 0.0007412433624267578, 0.0008062124252319336, 0.0008711814880371094, 0.0009361505508422852, 0.001001119613647461, 0.0010660886764526367, 0.0011310577392578125, 0.0011960268020629883, 0.001260995864868164, 0.0013259649276733398, 0.0013909339904785156, 0.0014559030532836914, 0.0015208721160888672, 0.001585841178894043, 0.0016508102416992188, 0.0017157793045043945, 0.0017807483673095703, 0.001845717430114746, 0.0019106864929199219, 0.0019756555557250977, 0.0020406246185302734, 0.0021055936813354492, 0.002170562744140625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 9.0, 2.0, 9.0, 17.0, 22.0, 24.0, 24.0, 29.0, 41.0, 68.0, 93.0, 121.0, 193.0, 383.0, 1394.0, 176131.0, 866623.0, 2189.0, 525.0, 215.0, 105.0, 71.0, 68.0, 52.0, 24.0, 23.0, 21.0, 18.0, 14.0, 18.0, 8.0, 4.0, 4.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.062347412109375, -0.060753822326660156, -0.05916023254394531, -0.05756664276123047, -0.055973052978515625, -0.05437946319580078, -0.05278587341308594, -0.051192283630371094, -0.04959869384765625, -0.048005104064941406, -0.04641151428222656, -0.04481792449951172, -0.043224334716796875, -0.04163074493408203, -0.04003715515136719, -0.038443565368652344, -0.0368499755859375, -0.035256385803222656, -0.03366279602050781, -0.03206920623779297, -0.030475616455078125, -0.02888202667236328, -0.027288436889648438, -0.025694847106933594, -0.02410125732421875, -0.022507667541503906, -0.020914077758789062, -0.01932048797607422, -0.017726898193359375, -0.01613330841064453, -0.014539718627929688, -0.012946128845214844, -0.0113525390625, -0.009758949279785156, -0.008165359497070312, -0.006571769714355469, -0.004978179931640625, -0.0033845901489257812, -0.0017910003662109375, -0.00019741058349609375, 0.00139617919921875, 0.0029897689819335938, 0.0045833587646484375, 0.006176948547363281, 0.007770538330078125, 0.009364128112792969, 0.010957717895507812, 0.012551307678222656, 0.0141448974609375, 0.015738487243652344, 0.017332077026367188, 0.01892566680908203, 0.020519256591796875, 0.02211284637451172, 0.023706436157226562, 0.025300025939941406, 0.02689361572265625, 0.028487205505371094, 0.030080795288085938, 0.03167438507080078, 0.033267974853515625, 0.03486156463623047, 0.03645515441894531, 0.038048744201660156, 0.039642333984375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 46.0, 849.0, 120.0, 1.0, 1.0], "bins": [-0.026967698708176613, -0.026522818952798843, -0.026077939197421074, -0.025633061304688454, -0.025188181549310684, -0.024743301793932915, -0.024298422038555145, -0.023853542283177376, -0.023408664390444756, -0.022963784635066986, -0.022518904879689217, -0.022074026986956596, -0.021629147231578827, -0.021184267476201057, -0.020739387720823288, -0.02029450796544552, -0.01984962821006775, -0.01940474845468998, -0.01895986869931221, -0.01851499080657959, -0.01807011105120182, -0.01762523129582405, -0.01718035154044628, -0.016735471785068512, -0.01629059389233589, -0.015845714136958122, -0.015400835312902927, -0.014955955557525158, -0.014511076733469963, -0.014066196978092194, -0.013621317222714424, -0.01317643839865923, -0.01273155864328146, -0.01228667888790369, -0.011841800063848495, -0.011396920308470726, -0.010952041484415531, -0.010507161729037762, -0.010062282904982567, -0.009617403149604797, -0.009172523394227028, -0.008727643638849258, -0.008282764814794064, -0.007837885059416294, -0.007393005769699812, -0.00694812647998333, -0.006503247190266848, -0.0060583679005503654, -0.005613488145172596, -0.005168608855456114, -0.004723729565739632, -0.004278849810361862, -0.00383397052064538, -0.003389091230928898, -0.0029442119412124157, -0.00249933241866529, -0.0020544533617794514, -0.0016095739556476474, -0.0011646945495158434, -0.0007198152597993612, -0.00027493585366755724, 0.00016994355246424675, 0.0006148228421807289, 0.0010597023647278547, 0.0015045816544443369]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 10.0, 10.0, 19.0, 23.0, 20.0, 28.0, 22.0, 43.0, 36.0, 51.0, 42.0, 47.0, 42.0, 45.0, 55.0, 35.0, 60.0, 52.0, 51.0, 52.0, 39.0, 35.0, 36.0, 27.0, 20.0, 14.0, 20.0, 17.0, 10.0, 10.0, 6.0, 2.0, 1.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001035928726196289, -0.0009940741583704948, -0.0009522195905447006, -0.0009103650227189064, -0.0008685104548931122, -0.000826655887067318, -0.0007848013192415237, -0.0007429467514157295, -0.0007010921835899353, -0.0006592376157641411, -0.0006173830479383469, -0.0005755284801125526, -0.0005336739122867584, -0.0004918193444609642, -0.00044996477663517, -0.00040811020880937576, -0.00036625564098358154, -0.0003244010731577873, -0.0002825465053319931, -0.00024069193750619888, -0.00019883736968040466, -0.00015698280185461044, -0.00011512823402881622, -7.3273666203022e-05, -3.141909837722778e-05, 1.0435469448566437e-05, 5.229003727436066e-05, 9.414460510015488e-05, 0.0001359991729259491, 0.00017785374075174332, 0.00021970830857753754, 0.00026156287640333176, 0.000303417444229126, 0.0003452720120549202, 0.0003871265798807144, 0.00042898114770650864, 0.00047083571553230286, 0.0005126902833580971, 0.0005545448511838913, 0.0005963994190096855, 0.0006382539868354797, 0.000680108554661274, 0.0007219631224870682, 0.0007638176903128624, 0.0008056722581386566, 0.0008475268259644508, 0.0008893813937902451, 0.0009312359616160393, 0.0009730905294418335, 0.0010149450972676277, 0.001056799665093422, 0.0010986542329192162, 0.0011405088007450104, 0.0011823633685708046, 0.0012242179363965988, 0.001266072504222393, 0.0013079270720481873, 0.0013497816398739815, 0.0013916362076997757, 0.00143349077552557, 0.0014753453433513641, 0.0015171999111771584, 0.0015590544790029526, 0.0016009090468287468, 0.001642763614654541]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 3.0, 5.0, 8.0, 10.0, 20.0, 17.0, 21.0, 21.0, 16.0, 34.0, 31.0, 30.0, 31.0, 26.0, 45.0, 47.0, 19.0, 41.0, 33.0, 47.0, 37.0, 40.0, 41.0, 37.0, 48.0, 37.0, 24.0, 31.0, 34.0, 27.0, 21.0, 24.0, 14.0, 14.0, 14.0, 6.0, 14.0, 6.0, 4.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.6484375, -5.484619140625, -5.32080078125, -5.156982421875, -4.9931640625, -4.829345703125, -4.66552734375, -4.501708984375, -4.337890625, -4.174072265625, -4.01025390625, -3.846435546875, -3.6826171875, -3.518798828125, -3.35498046875, -3.191162109375, -3.02734375, -2.863525390625, -2.69970703125, -2.535888671875, -2.3720703125, -2.208251953125, -2.04443359375, -1.880615234375, -1.716796875, -1.552978515625, -1.38916015625, -1.225341796875, -1.0615234375, -0.897705078125, -0.73388671875, -0.570068359375, -0.40625, -0.242431640625, -0.07861328125, 0.085205078125, 0.2490234375, 0.412841796875, 0.57666015625, 0.740478515625, 0.904296875, 1.068115234375, 1.23193359375, 1.395751953125, 1.5595703125, 1.723388671875, 1.88720703125, 2.051025390625, 2.21484375, 2.378662109375, 2.54248046875, 2.706298828125, 2.8701171875, 3.033935546875, 3.19775390625, 3.361572265625, 3.525390625, 3.689208984375, 3.85302734375, 4.016845703125, 4.1806640625, 4.344482421875, 4.50830078125, 4.672119140625, 4.8359375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 7.0, 6.0, 13.0, 15.0, 34.0, 60.0, 64.0, 85.0, 151.0, 177.0, 305.0, 478.0, 746.0, 1157.0, 1913.0, 3385.0, 5838.0, 11102.0, 21667.0, 47833.0, 115371.0, 312733.0, 314018.0, 116013.0, 47485.0, 22263.0, 11033.0, 5890.0, 3445.0, 1984.0, 1212.0, 693.0, 443.0, 315.0, 173.0, 122.0, 94.0, 74.0, 53.0, 29.0, 26.0, 15.0, 9.0, 6.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-3.86328125, -3.749664306640625, -3.63604736328125, -3.522430419921875, -3.4088134765625, -3.295196533203125, -3.18157958984375, -3.067962646484375, -2.954345703125, -2.840728759765625, -2.72711181640625, -2.613494873046875, -2.4998779296875, -2.386260986328125, -2.27264404296875, -2.159027099609375, -2.04541015625, -1.931793212890625, -1.81817626953125, -1.704559326171875, -1.5909423828125, -1.477325439453125, -1.36370849609375, -1.250091552734375, -1.136474609375, -1.022857666015625, -0.90924072265625, -0.795623779296875, -0.6820068359375, -0.568389892578125, -0.45477294921875, -0.341156005859375, -0.2275390625, -0.113922119140625, -0.00030517578125, 0.113311767578125, 0.2269287109375, 0.340545654296875, 0.45416259765625, 0.567779541015625, 0.681396484375, 0.795013427734375, 0.90863037109375, 1.022247314453125, 1.1358642578125, 1.249481201171875, 1.36309814453125, 1.476715087890625, 1.59033203125, 1.703948974609375, 1.81756591796875, 1.931182861328125, 2.0447998046875, 2.158416748046875, 2.27203369140625, 2.385650634765625, 2.499267578125, 2.612884521484375, 2.72650146484375, 2.840118408203125, 2.9537353515625, 3.067352294921875, 3.18096923828125, 3.294586181640625, 3.408203125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 6.0, 11.0, 10.0, 9.0, 14.0, 14.0, 11.0, 17.0, 26.0, 27.0, 22.0, 31.0, 43.0, 45.0, 49.0, 52.0, 82.0, 136.0, 1586.0, 268.0, 99.0, 69.0, 56.0, 37.0, 40.0, 43.0, 41.0, 31.0, 22.0, 25.0, 19.0, 23.0, 16.0, 15.0, 6.0, 9.0, 5.0, 9.0, 2.0, 2.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.5625, -18.0286865234375, -17.494873046875, -16.9610595703125, -16.42724609375, -15.8934326171875, -15.359619140625, -14.8258056640625, -14.2919921875, -13.7581787109375, -13.224365234375, -12.6905517578125, -12.15673828125, -11.6229248046875, -11.089111328125, -10.5552978515625, -10.021484375, -9.4876708984375, -8.953857421875, -8.4200439453125, -7.88623046875, -7.3524169921875, -6.818603515625, -6.2847900390625, -5.7509765625, -5.2171630859375, -4.683349609375, -4.1495361328125, -3.61572265625, -3.0819091796875, -2.548095703125, -2.0142822265625, -1.48046875, -0.9466552734375, -0.412841796875, 0.1209716796875, 0.65478515625, 1.1885986328125, 1.722412109375, 2.2562255859375, 2.7900390625, 3.3238525390625, 3.857666015625, 4.3914794921875, 4.92529296875, 5.4591064453125, 5.992919921875, 6.5267333984375, 7.060546875, 7.5943603515625, 8.128173828125, 8.6619873046875, 9.19580078125, 9.7296142578125, 10.263427734375, 10.7972412109375, 11.3310546875, 11.8648681640625, 12.398681640625, 12.9324951171875, 13.46630859375, 14.0001220703125, 14.533935546875, 15.0677490234375, 15.6015625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 11.0, 18.0, 37.0, 66.0, 119.0, 223.0, 404.0, 941.0, 2124166.0, 1018014.0, 894.0, 352.0, 197.0, 102.0, 66.0, 35.0, 28.0, 8.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.125, -115.015625, -111.90625, -108.796875, -105.6875, -102.578125, -99.46875, -96.359375, -93.25, -90.140625, -87.03125, -83.921875, -80.8125, -77.703125, -74.59375, -71.484375, -68.375, -65.265625, -62.15625, -59.046875, -55.9375, -52.828125, -49.71875, -46.609375, -43.5, -40.390625, -37.28125, -34.171875, -31.0625, -27.953125, -24.84375, -21.734375, -18.625, -15.515625, -12.40625, -9.296875, -6.1875, -3.078125, 0.03125, 3.140625, 6.25, 9.359375, 12.46875, 15.578125, 18.6875, 21.796875, 24.90625, 28.015625, 31.125, 34.234375, 37.34375, 40.453125, 43.5625, 46.671875, 49.78125, 52.890625, 56.0, 59.109375, 62.21875, 65.328125, 68.4375, 71.546875, 74.65625, 77.765625, 80.875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [912.0, 108.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.222808837890625, 2.0210132598876953, 13.264835357666016, 24.50865936279297, 35.752479553222656, 46.996299743652344, 58.24012756347656, 69.48394775390625, 80.72776794433594, 91.97158813476562, 103.21540832519531, 114.45923614501953, 125.70305633544922, 136.94686889648438, 148.19070434570312, 159.4345245361328, 170.6783447265625, 181.9221649169922, 193.16598510742188, 204.40982055664062, 215.65362548828125, 226.8974609375, 238.1412811279297, 249.38510131835938, 260.62890625, 271.87274169921875, 283.1165466308594, 294.3603820800781, 305.60418701171875, 316.8480224609375, 328.09185791015625, 339.3356628417969, 350.57952880859375, 361.8233642578125, 373.0671691894531, 384.3110046386719, 395.5548095703125, 406.79864501953125, 418.04248046875, 429.2862854003906, 440.53009033203125, 451.77392578125, 463.0177307128906, 474.2615661621094, 485.50537109375, 496.74920654296875, 507.9930419921875, 519.23681640625, 530.480712890625, 541.7245483398438, 552.9683837890625, 564.212158203125, 575.4559936523438, 586.6998291015625, 597.9436645507812, 609.1875, 620.4312744140625, 631.6751098632812, 642.9189453125, 654.1627197265625, 665.4065551757812, 676.650390625, 687.8942260742188, 699.1380615234375, 710.3818359375]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 6.0, 3.0, 4.0, 5.0, 14.0, 10.0, 7.0, 14.0, 19.0, 20.0, 25.0, 25.0, 19.0, 29.0, 26.0, 34.0, 31.0, 30.0, 45.0, 45.0, 49.0, 49.0, 43.0, 37.0, 42.0, 44.0, 44.0, 37.0, 27.0, 35.0, 32.0, 18.0, 29.0, 19.0, 29.0, 7.0, 16.0, 10.0, 12.0, 2.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.857139587402344, -52.239131927490234, -50.621124267578125, -49.003116607666016, -47.385108947753906, -45.7671012878418, -44.14909362792969, -42.531089782714844, -40.91307830810547, -39.29507064819336, -37.67706298828125, -36.05905532836914, -34.44104766845703, -32.82304000854492, -31.205034255981445, -29.587026596069336, -27.96902084350586, -26.35101318359375, -24.73300552368164, -23.11499786376953, -21.496990203857422, -19.878982543945312, -18.260976791381836, -16.642969131469727, -15.024961471557617, -13.406953811645508, -11.788946151733398, -10.170939445495605, -8.552931785583496, -6.934924125671387, -5.316917419433594, -3.6989097595214844, -2.080902099609375, -0.4628946781158447, 1.1551127433776855, 2.7731199264526367, 4.391127586364746, 6.0091352462768555, 7.627141952514648, 9.245149612426758, 10.863157272338867, 12.481164932250977, 14.099172592163086, 15.717179298400879, 17.335186004638672, 18.95319366455078, 20.57120132446289, 22.189208984375, 23.80721664428711, 25.42522430419922, 27.043231964111328, 28.661239624023438, 30.279247283935547, 31.897254943847656, 33.5152587890625, 35.133270263671875, 36.75127410888672, 38.36928176879883, 39.98728942871094, 41.60529708862305, 43.223304748535156, 44.841312408447266, 46.459320068359375, 48.07732391357422, 49.695335388183594]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 4.0, 11.0, 10.0, 13.0, 14.0, 14.0, 24.0, 30.0, 26.0, 25.0, 33.0, 28.0, 28.0, 34.0, 36.0, 46.0, 34.0, 37.0, 38.0, 46.0, 42.0, 38.0, 33.0, 48.0, 32.0, 29.0, 28.0, 24.0, 30.0, 31.0, 14.0, 20.0, 20.0, 16.0, 10.0, 11.0, 7.0, 5.0, 3.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-5.87109375, -5.7021484375, -5.533203125, -5.3642578125, -5.1953125, -5.0263671875, -4.857421875, -4.6884765625, -4.51953125, -4.3505859375, -4.181640625, -4.0126953125, -3.84375, -3.6748046875, -3.505859375, -3.3369140625, -3.16796875, -2.9990234375, -2.830078125, -2.6611328125, -2.4921875, -2.3232421875, -2.154296875, -1.9853515625, -1.81640625, -1.6474609375, -1.478515625, -1.3095703125, -1.140625, -0.9716796875, -0.802734375, -0.6337890625, -0.46484375, -0.2958984375, -0.126953125, 0.0419921875, 0.2109375, 0.3798828125, 0.548828125, 0.7177734375, 0.88671875, 1.0556640625, 1.224609375, 1.3935546875, 1.5625, 1.7314453125, 1.900390625, 2.0693359375, 2.23828125, 2.4072265625, 2.576171875, 2.7451171875, 2.9140625, 3.0830078125, 3.251953125, 3.4208984375, 3.58984375, 3.7587890625, 3.927734375, 4.0966796875, 4.265625, 4.4345703125, 4.603515625, 4.7724609375, 4.94140625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 8.0, 4.0, 7.0, 7.0, 8.0, 19.0, 11.0, 15.0, 22.0, 27.0, 19.0, 29.0, 37.0, 89.0, 105.0, 207.0, 482.0, 1284.0, 4806.0, 34978.0, 632244.0, 2877699.0, 601026.0, 33970.0, 4794.0, 1275.0, 506.0, 192.0, 110.0, 60.0, 35.0, 39.0, 21.0, 28.0, 21.0, 13.0, 19.0, 18.0, 8.0, 10.0, 10.0, 5.0, 1.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.7578125, -13.3209228515625, -12.884033203125, -12.4471435546875, -12.01025390625, -11.5733642578125, -11.136474609375, -10.6995849609375, -10.2626953125, -9.8258056640625, -9.388916015625, -8.9520263671875, -8.51513671875, -8.0782470703125, -7.641357421875, -7.2044677734375, -6.767578125, -6.3306884765625, -5.893798828125, -5.4569091796875, -5.02001953125, -4.5831298828125, -4.146240234375, -3.7093505859375, -3.2724609375, -2.8355712890625, -2.398681640625, -1.9617919921875, -1.52490234375, -1.0880126953125, -0.651123046875, -0.2142333984375, 0.22265625, 0.6595458984375, 1.096435546875, 1.5333251953125, 1.97021484375, 2.4071044921875, 2.843994140625, 3.2808837890625, 3.7177734375, 4.1546630859375, 4.591552734375, 5.0284423828125, 5.46533203125, 5.9022216796875, 6.339111328125, 6.7760009765625, 7.212890625, 7.6497802734375, 8.086669921875, 8.5235595703125, 8.96044921875, 9.3973388671875, 9.834228515625, 10.2711181640625, 10.7080078125, 11.1448974609375, 11.581787109375, 12.0186767578125, 12.45556640625, 12.8924560546875, 13.329345703125, 13.7662353515625, 14.203125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 7.0, 5.0, 12.0, 10.0, 13.0, 22.0, 34.0, 29.0, 43.0, 50.0, 69.0, 75.0, 128.0, 167.0, 189.0, 242.0, 357.0, 399.0, 373.0, 362.0, 328.0, 272.0, 221.0, 155.0, 133.0, 81.0, 70.0, 42.0, 51.0, 27.0, 32.0, 15.0, 10.0, 12.0, 9.0, 9.0, 1.0, 2.0, 6.0, 3.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.97265625, -8.6875, -8.40234375, -8.1171875, -7.83203125, -7.546875, -7.26171875, -6.9765625, -6.69140625, -6.40625, -6.12109375, -5.8359375, -5.55078125, -5.265625, -4.98046875, -4.6953125, -4.41015625, -4.125, -3.83984375, -3.5546875, -3.26953125, -2.984375, -2.69921875, -2.4140625, -2.12890625, -1.84375, -1.55859375, -1.2734375, -0.98828125, -0.703125, -0.41796875, -0.1328125, 0.15234375, 0.4375, 0.72265625, 1.0078125, 1.29296875, 1.578125, 1.86328125, 2.1484375, 2.43359375, 2.71875, 3.00390625, 3.2890625, 3.57421875, 3.859375, 4.14453125, 4.4296875, 4.71484375, 5.0, 5.28515625, 5.5703125, 5.85546875, 6.140625, 6.42578125, 6.7109375, 6.99609375, 7.28125, 7.56640625, 7.8515625, 8.13671875, 8.421875, 8.70703125, 8.9921875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 13.0, 3.0, 9.0, 13.0, 18.0, 31.0, 30.0, 39.0, 47.0, 70.0, 88.0, 129.0, 146.0, 205.0, 252.0, 384.0, 886.0, 14011.0, 3469605.0, 702230.0, 4118.0, 596.0, 332.0, 227.0, 168.0, 144.0, 95.0, 85.0, 76.0, 51.0, 34.0, 40.0, 28.0, 21.0, 16.0, 5.0, 7.0, 6.0, 2.0, 11.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.96875, -43.64013671875, -42.3115234375, -40.98291015625, -39.654296875, -38.32568359375, -36.9970703125, -35.66845703125, -34.33984375, -33.01123046875, -31.6826171875, -30.35400390625, -29.025390625, -27.69677734375, -26.3681640625, -25.03955078125, -23.7109375, -22.38232421875, -21.0537109375, -19.72509765625, -18.396484375, -17.06787109375, -15.7392578125, -14.41064453125, -13.08203125, -11.75341796875, -10.4248046875, -9.09619140625, -7.767578125, -6.43896484375, -5.1103515625, -3.78173828125, -2.453125, -1.12451171875, 0.2041015625, 1.53271484375, 2.861328125, 4.18994140625, 5.5185546875, 6.84716796875, 8.17578125, 9.50439453125, 10.8330078125, 12.16162109375, 13.490234375, 14.81884765625, 16.1474609375, 17.47607421875, 18.8046875, 20.13330078125, 21.4619140625, 22.79052734375, 24.119140625, 25.44775390625, 26.7763671875, 28.10498046875, 29.43359375, 30.76220703125, 32.0908203125, 33.41943359375, 34.748046875, 36.07666015625, 37.4052734375, 38.73388671875, 40.0625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 11.0, 18.0, 37.0, 45.0, 74.0, 104.0, 95.0, 115.0, 106.0, 118.0, 99.0, 60.0, 57.0, 28.0, 13.0, 8.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.936431884765625, -31.567873001098633, -30.199316024780273, -28.83075714111328, -27.462200164794922, -26.09364128112793, -24.725082397460938, -23.356525421142578, -21.987966537475586, -20.619407653808594, -19.250850677490234, -17.882291793823242, -16.51373291015625, -15.14517593383789, -13.776617050170898, -12.408059120178223, -11.039501190185547, -9.670943260192871, -8.302385330200195, -6.933826446533203, -5.565268516540527, -4.196710586547852, -2.8281517028808594, -1.4595937728881836, -0.09103584289550781, 1.277522325515747, 2.646080493927002, 4.014638900756836, 5.383196830749512, 6.7517547607421875, 8.12031364440918, 9.488871574401855, 10.857425689697266, 12.225983619689941, 13.594541549682617, 14.96310043334961, 16.33165740966797, 17.70021629333496, 19.068775177001953, 20.437332153320312, 21.805891036987305, 23.174449920654297, 24.543006896972656, 25.91156578063965, 27.28012466430664, 28.648681640625, 30.017240524291992, 31.385799407958984, 32.754356384277344, 34.1229133605957, 35.49147415161133, 36.86003112792969, 38.22858810424805, 39.597145080566406, 40.96570587158203, 42.33426284790039, 43.70281982421875, 45.07137680053711, 46.439937591552734, 47.808494567871094, 49.17705154418945, 50.54560852050781, 51.91416931152344, 53.2827262878418, 54.65128707885742]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 5.0, 10.0, 4.0, 5.0, 12.0, 7.0, 16.0, 20.0, 17.0, 14.0, 26.0, 19.0, 28.0, 27.0, 32.0, 29.0, 35.0, 37.0, 35.0, 48.0, 31.0, 44.0, 34.0, 36.0, 35.0, 34.0, 35.0, 41.0, 24.0, 38.0, 29.0, 27.0, 21.0, 17.0, 17.0, 19.0, 18.0, 9.0, 18.0, 9.0, 8.0, 8.0, 3.0, 3.0, 6.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.09229278564453, -31.064437866210938, -30.036582946777344, -29.00872802734375, -27.980873107910156, -26.953018188476562, -25.92516326904297, -24.897308349609375, -23.86945343017578, -22.841598510742188, -21.813743591308594, -20.785888671875, -19.758033752441406, -18.730178833007812, -17.70232391357422, -16.674468994140625, -15.646614074707031, -14.618759155273438, -13.590904235839844, -12.56304931640625, -11.535194396972656, -10.507339477539062, -9.479484558105469, -8.451629638671875, -7.423774719238281, -6.3959197998046875, -5.368064880371094, -4.3402099609375, -3.3123550415039062, -2.2845001220703125, -1.2566452026367188, -0.228790283203125, 0.7990646362304688, 1.8269195556640625, 2.8547744750976562, 3.88262939453125, 4.910484313964844, 5.9383392333984375, 6.966194152832031, 7.994049072265625, 9.021903991699219, 10.049758911132812, 11.077613830566406, 12.10546875, 13.133323669433594, 14.161178588867188, 15.189033508300781, 16.216888427734375, 17.24474334716797, 18.272598266601562, 19.300453186035156, 20.32830810546875, 21.356163024902344, 22.384017944335938, 23.41187286376953, 24.439727783203125, 25.46758270263672, 26.495437622070312, 27.523292541503906, 28.5511474609375, 29.579002380371094, 30.606857299804688, 31.63471221923828, 32.662567138671875, 33.69042205810547]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 2.0, 7.0, 10.0, 9.0, 13.0, 18.0, 15.0, 23.0, 20.0, 14.0, 29.0, 26.0, 37.0, 32.0, 24.0, 44.0, 43.0, 36.0, 43.0, 33.0, 52.0, 38.0, 47.0, 43.0, 42.0, 29.0, 32.0, 31.0, 31.0, 26.0, 14.0, 24.0, 19.0, 15.0, 16.0, 8.0, 14.0, 11.0, 8.0, 5.0, 2.0, 4.0, 1.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.703125, -5.54095458984375, -5.3787841796875, -5.21661376953125, -5.054443359375, -4.89227294921875, -4.7301025390625, -4.56793212890625, -4.40576171875, -4.24359130859375, -4.0814208984375, -3.91925048828125, -3.757080078125, -3.59490966796875, -3.4327392578125, -3.27056884765625, -3.1083984375, -2.94622802734375, -2.7840576171875, -2.62188720703125, -2.459716796875, -2.29754638671875, -2.1353759765625, -1.97320556640625, -1.81103515625, -1.64886474609375, -1.4866943359375, -1.32452392578125, -1.162353515625, -1.00018310546875, -0.8380126953125, -0.67584228515625, -0.513671875, -0.35150146484375, -0.1893310546875, -0.02716064453125, 0.135009765625, 0.29718017578125, 0.4593505859375, 0.62152099609375, 0.78369140625, 0.94586181640625, 1.1080322265625, 1.27020263671875, 1.432373046875, 1.59454345703125, 1.7567138671875, 1.91888427734375, 2.0810546875, 2.24322509765625, 2.4053955078125, 2.56756591796875, 2.729736328125, 2.89190673828125, 3.0540771484375, 3.21624755859375, 3.37841796875, 3.54058837890625, 3.7027587890625, 3.86492919921875, 4.027099609375, 4.18927001953125, 4.3514404296875, 4.51361083984375, 4.67578125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 1.0, 14.0, 5.0, 11.0, 23.0, 25.0, 54.0, 73.0, 98.0, 163.0, 280.0, 409.0, 579.0, 790.0, 1133.0, 1603.0, 2387.0, 3344.0, 4882.0, 7184.0, 10448.0, 15888.0, 24413.0, 38303.0, 60910.0, 101705.0, 169350.0, 209978.0, 150240.0, 89455.0, 54109.0, 33871.0, 21791.0, 14173.0, 9667.0, 6793.0, 4585.0, 3116.0, 2050.0, 1426.0, 999.0, 705.0, 454.0, 340.0, 222.0, 126.0, 123.0, 76.0, 67.0, 34.0, 28.0, 19.0, 22.0, 6.0, 8.0, 1.0, 2.0], "bins": [-0.69970703125, -0.679351806640625, -0.65899658203125, -0.638641357421875, -0.6182861328125, -0.597930908203125, -0.57757568359375, -0.557220458984375, -0.536865234375, -0.516510009765625, -0.49615478515625, -0.475799560546875, -0.4554443359375, -0.435089111328125, -0.41473388671875, -0.394378662109375, -0.3740234375, -0.353668212890625, -0.33331298828125, -0.312957763671875, -0.2926025390625, -0.272247314453125, -0.25189208984375, -0.231536865234375, -0.211181640625, -0.190826416015625, -0.17047119140625, -0.150115966796875, -0.1297607421875, -0.109405517578125, -0.08905029296875, -0.068695068359375, -0.04833984375, -0.027984619140625, -0.00762939453125, 0.012725830078125, 0.0330810546875, 0.053436279296875, 0.07379150390625, 0.094146728515625, 0.114501953125, 0.134857177734375, 0.15521240234375, 0.175567626953125, 0.1959228515625, 0.216278076171875, 0.23663330078125, 0.256988525390625, 0.27734375, 0.297698974609375, 0.31805419921875, 0.338409423828125, 0.3587646484375, 0.379119873046875, 0.39947509765625, 0.419830322265625, 0.440185546875, 0.460540771484375, 0.48089599609375, 0.501251220703125, 0.5216064453125, 0.541961669921875, 0.56231689453125, 0.582672119140625, 0.60302734375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 8.0, 11.0, 8.0, 14.0, 7.0, 13.0, 16.0, 22.0, 25.0, 26.0, 33.0, 27.0, 31.0, 29.0, 23.0, 29.0, 39.0, 47.0, 43.0, 43.0, 1064.0, 39.0, 37.0, 34.0, 23.0, 33.0, 39.0, 31.0, 28.0, 24.0, 24.0, 24.0, 19.0, 15.0, 14.0, 14.0, 11.0, 14.0, 8.0, 6.0, 8.0, 6.0, 2.0, 5.0, 2.0, 0.0, 3.0], "bins": [-3.62890625, -3.531341552734375, -3.43377685546875, -3.336212158203125, -3.2386474609375, -3.141082763671875, -3.04351806640625, -2.945953369140625, -2.848388671875, -2.750823974609375, -2.65325927734375, -2.555694580078125, -2.4581298828125, -2.360565185546875, -2.26300048828125, -2.165435791015625, -2.06787109375, -1.970306396484375, -1.87274169921875, -1.775177001953125, -1.6776123046875, -1.580047607421875, -1.48248291015625, -1.384918212890625, -1.287353515625, -1.189788818359375, -1.09222412109375, -0.994659423828125, -0.8970947265625, -0.799530029296875, -0.70196533203125, -0.604400634765625, -0.5068359375, -0.409271240234375, -0.31170654296875, -0.214141845703125, -0.1165771484375, -0.019012451171875, 0.07855224609375, 0.176116943359375, 0.273681640625, 0.371246337890625, 0.46881103515625, 0.566375732421875, 0.6639404296875, 0.761505126953125, 0.85906982421875, 0.956634521484375, 1.05419921875, 1.151763916015625, 1.24932861328125, 1.346893310546875, 1.4444580078125, 1.542022705078125, 1.63958740234375, 1.737152099609375, 1.834716796875, 1.932281494140625, 2.02984619140625, 2.127410888671875, 2.2249755859375, 2.322540283203125, 2.42010498046875, 2.517669677734375, 2.615234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 12.0, 8.0, 8.0, 18.0, 33.0, 50.0, 62.0, 91.0, 143.0, 220.0, 379.0, 591.0, 946.0, 1561.0, 2542.0, 4224.0, 7150.0, 12628.0, 23002.0, 42090.0, 79174.0, 151165.0, 1287787.0, 216355.0, 122861.0, 64728.0, 34763.0, 18684.0, 10523.0, 6013.0, 3559.0, 2113.0, 1290.0, 842.0, 538.0, 342.0, 244.0, 137.0, 96.0, 45.0, 38.0, 34.0, 18.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.64990234375, -0.6301116943359375, -0.610321044921875, -0.5905303955078125, -0.57073974609375, -0.5509490966796875, -0.531158447265625, -0.5113677978515625, -0.4915771484375, -0.4717864990234375, -0.451995849609375, -0.4322052001953125, -0.41241455078125, -0.3926239013671875, -0.372833251953125, -0.3530426025390625, -0.333251953125, -0.3134613037109375, -0.293670654296875, -0.2738800048828125, -0.25408935546875, -0.2342987060546875, -0.214508056640625, -0.1947174072265625, -0.1749267578125, -0.1551361083984375, -0.135345458984375, -0.1155548095703125, -0.09576416015625, -0.0759735107421875, -0.056182861328125, -0.0363922119140625, -0.0166015625, 0.0031890869140625, 0.022979736328125, 0.0427703857421875, 0.06256103515625, 0.0823516845703125, 0.102142333984375, 0.1219329833984375, 0.1417236328125, 0.1615142822265625, 0.181304931640625, 0.2010955810546875, 0.22088623046875, 0.2406768798828125, 0.260467529296875, 0.2802581787109375, 0.300048828125, 0.3198394775390625, 0.339630126953125, 0.3594207763671875, 0.37921142578125, 0.3990020751953125, 0.418792724609375, 0.4385833740234375, 0.4583740234375, 0.4781646728515625, 0.497955322265625, 0.5177459716796875, 0.53753662109375, 0.5573272705078125, 0.577117919921875, 0.5969085693359375, 0.61669921875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 11.0, 12.0, 10.0, 11.0, 13.0, 25.0, 10.0, 22.0, 27.0, 30.0, 39.0, 42.0, 38.0, 39.0, 57.0, 56.0, 48.0, 58.0, 57.0, 46.0, 41.0, 50.0, 37.0, 32.0, 35.0, 27.0, 15.0, 24.0, 14.0, 8.0, 10.0, 10.0, 12.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.002185821533203125, -0.002126649022102356, -0.002067476511001587, -0.002008303999900818, -0.0019491314888000488, -0.0018899589776992798, -0.0018307864665985107, -0.0017716139554977417, -0.0017124414443969727, -0.0016532689332962036, -0.0015940964221954346, -0.0015349239110946655, -0.0014757513999938965, -0.0014165788888931274, -0.0013574063777923584, -0.0012982338666915894, -0.0012390613555908203, -0.0011798888444900513, -0.0011207163333892822, -0.0010615438222885132, -0.0010023713111877441, -0.0009431988000869751, -0.0008840262889862061, -0.000824853777885437, -0.000765681266784668, -0.0007065087556838989, -0.0006473362445831299, -0.0005881637334823608, -0.0005289912223815918, -0.00046981871128082275, -0.0004106462001800537, -0.00035147368907928467, -0.0002923011779785156, -0.00023312866687774658, -0.00017395615577697754, -0.0001147836446762085, -5.561113357543945e-05, 3.56137752532959e-06, 6.273388862609863e-05, 0.00012190639972686768, 0.00018107891082763672, 0.00024025142192840576, 0.0002994239330291748, 0.00035859644412994385, 0.0004177689552307129, 0.00047694146633148193, 0.000536113977432251, 0.00059528648853302, 0.0006544589996337891, 0.0007136315107345581, 0.0007728040218353271, 0.0008319765329360962, 0.0008911490440368652, 0.0009503215551376343, 0.0010094940662384033, 0.0010686665773391724, 0.0011278390884399414, 0.0011870115995407104, 0.0012461841106414795, 0.0013053566217422485, 0.0013645291328430176, 0.0014237016439437866, 0.0014828741550445557, 0.0015420466661453247, 0.0016012191772460938]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 3.0, 7.0, 11.0, 21.0, 22.0, 20.0, 29.0, 29.0, 42.0, 66.0, 58.0, 85.0, 127.0, 209.0, 439.0, 1140.0, 29294.0, 1001116.0, 13762.0, 937.0, 383.0, 175.0, 128.0, 99.0, 58.0, 52.0, 51.0, 39.0, 29.0, 22.0, 19.0, 10.0, 12.0, 12.0, 9.0, 10.0, 6.0, 4.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.034637451171875, -0.033374786376953125, -0.03211212158203125, -0.030849456787109375, -0.0295867919921875, -0.028324127197265625, -0.02706146240234375, -0.025798797607421875, -0.0245361328125, -0.023273468017578125, -0.02201080322265625, -0.020748138427734375, -0.0194854736328125, -0.018222808837890625, -0.01696014404296875, -0.015697479248046875, -0.014434814453125, -0.013172149658203125, -0.01190948486328125, -0.010646820068359375, -0.0093841552734375, -0.008121490478515625, -0.00685882568359375, -0.005596160888671875, -0.00433349609375, -0.003070831298828125, -0.00180816650390625, -0.000545501708984375, 0.0007171630859375, 0.001979827880859375, 0.00324249267578125, 0.004505157470703125, 0.005767822265625, 0.007030487060546875, 0.00829315185546875, 0.009555816650390625, 0.0108184814453125, 0.012081146240234375, 0.01334381103515625, 0.014606475830078125, 0.015869140625, 0.017131805419921875, 0.01839447021484375, 0.019657135009765625, 0.0209197998046875, 0.022182464599609375, 0.02344512939453125, 0.024707794189453125, 0.025970458984375, 0.027233123779296875, 0.02849578857421875, 0.029758453369140625, 0.0310211181640625, 0.032283782958984375, 0.03354644775390625, 0.034809112548828125, 0.03607177734375, 0.037334442138671875, 0.03859710693359375, 0.039859771728515625, 0.0411224365234375, 0.042385101318359375, 0.04364776611328125, 0.044910430908203125, 0.046173095703125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 35.0, 958.0, 23.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03621470928192139, -0.03551113232970238, -0.034807559102773666, -0.03410398215055466, -0.03340040519833565, -0.03269682824611664, -0.03199325501918793, -0.03128967806696892, -0.03058610111474991, -0.02988252602517605, -0.02917894907295704, -0.02847537398338318, -0.02777179703116417, -0.02706822194159031, -0.02636464685201645, -0.02566106989979744, -0.02495749481022358, -0.02425391972064972, -0.02355034276843071, -0.02284676767885685, -0.02214319072663784, -0.02143961563706398, -0.02073603868484497, -0.02003246359527111, -0.01932888850569725, -0.01862531341612339, -0.01792173646390438, -0.01721816137433052, -0.01651458442211151, -0.01581100933253765, -0.015107433311641216, -0.014403857290744781, -0.013700282201170921, -0.012996706180274487, -0.012293130159378052, -0.011589555069804192, -0.010885978117585182, -0.010182403028011322, -0.009478827007114887, -0.008775250986218452, -0.008071674965322018, -0.007368098944425583, -0.006664522923529148, -0.005960947368294001, -0.005257371347397566, -0.004553795326501131, -0.0038502197712659836, -0.003146643750369549, -0.002443067729473114, -0.001739491824992001, -0.001035915920510888, -0.00033234013244509697, 0.0003712358884513378, 0.0010748119093477726, 0.00177838746458292, 0.002481963485479355, 0.0031855395063757896, 0.0038891155272722244, 0.004592691548168659, 0.005296267103403807, 0.0059998431243002415, 0.006703419145196676, 0.007406994700431824, 0.008110570721328259, 0.008814146742224693]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 2.0, 6.0, 2.0, 9.0, 7.0, 9.0, 15.0, 15.0, 19.0, 29.0, 32.0, 30.0, 43.0, 48.0, 41.0, 58.0, 63.0, 61.0, 48.0, 51.0, 49.0, 50.0, 55.0, 50.0, 41.0, 38.0, 23.0, 28.0, 17.0, 12.0, 14.0, 14.0, 5.0, 6.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000955045223236084, -0.0009106993675231934, -0.0008663535118103027, -0.0008220076560974121, -0.0007776618003845215, -0.0007333159446716309, -0.0006889700889587402, -0.0006446242332458496, -0.000600278377532959, -0.0005559325218200684, -0.0005115866661071777, -0.0004672408103942871, -0.0004228949546813965, -0.00037854909896850586, -0.00033420324325561523, -0.0002898573875427246, -0.000245511531829834, -0.00020116567611694336, -0.00015681982040405273, -0.00011247396469116211, -6.812810897827148e-05, -2.378225326538086e-05, 2.0563602447509766e-05, 6.490945816040039e-05, 0.00010925531387329102, 0.00015360116958618164, 0.00019794702529907227, 0.0002422928810119629, 0.0002866387367248535, 0.00033098459243774414, 0.00037533044815063477, 0.0004196763038635254, 0.000464022159576416, 0.0005083680152893066, 0.0005527138710021973, 0.0005970597267150879, 0.0006414055824279785, 0.0006857514381408691, 0.0007300972938537598, 0.0007744431495666504, 0.000818789005279541, 0.0008631348609924316, 0.0009074807167053223, 0.0009518265724182129, 0.0009961724281311035, 0.0010405182838439941, 0.0010848641395568848, 0.0011292099952697754, 0.001173555850982666, 0.0012179017066955566, 0.0012622475624084473, 0.0013065934181213379, 0.0013509392738342285, 0.0013952851295471191, 0.0014396309852600098, 0.0014839768409729004, 0.001528322696685791, 0.0015726685523986816, 0.0016170144081115723, 0.0016613602638244629, 0.0017057061195373535, 0.0017500519752502441, 0.0017943978309631348, 0.0018387436866760254, 0.001883089542388916]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 2.0, 7.0, 10.0, 9.0, 13.0, 18.0, 15.0, 23.0, 20.0, 14.0, 29.0, 26.0, 37.0, 32.0, 24.0, 44.0, 43.0, 36.0, 43.0, 33.0, 52.0, 38.0, 47.0, 43.0, 42.0, 29.0, 32.0, 31.0, 31.0, 26.0, 14.0, 24.0, 19.0, 15.0, 16.0, 8.0, 14.0, 11.0, 8.0, 5.0, 2.0, 4.0, 1.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.703125, -5.54095458984375, -5.3787841796875, -5.21661376953125, -5.054443359375, -4.89227294921875, -4.7301025390625, -4.56793212890625, -4.40576171875, -4.24359130859375, -4.0814208984375, -3.91925048828125, -3.757080078125, -3.59490966796875, -3.4327392578125, -3.27056884765625, -3.1083984375, -2.94622802734375, -2.7840576171875, -2.62188720703125, -2.459716796875, -2.29754638671875, -2.1353759765625, -1.97320556640625, -1.81103515625, -1.64886474609375, -1.4866943359375, -1.32452392578125, -1.162353515625, -1.00018310546875, -0.8380126953125, -0.67584228515625, -0.513671875, -0.35150146484375, -0.1893310546875, -0.02716064453125, 0.135009765625, 0.29718017578125, 0.4593505859375, 0.62152099609375, 0.78369140625, 0.94586181640625, 1.1080322265625, 1.27020263671875, 1.432373046875, 1.59454345703125, 1.7567138671875, 1.91888427734375, 2.0810546875, 2.24322509765625, 2.4053955078125, 2.56756591796875, 2.729736328125, 2.89190673828125, 3.0540771484375, 3.21624755859375, 3.37841796875, 3.54058837890625, 3.7027587890625, 3.86492919921875, 4.027099609375, 4.18927001953125, 4.3514404296875, 4.51361083984375, 4.67578125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 3.0, 8.0, 10.0, 15.0, 33.0, 26.0, 28.0, 62.0, 81.0, 94.0, 150.0, 274.0, 387.0, 708.0, 1530.0, 3003.0, 7127.0, 20471.0, 72841.0, 304327.0, 470563.0, 118014.0, 30724.0, 9897.0, 4008.0, 1896.0, 901.0, 512.0, 290.0, 188.0, 109.0, 76.0, 49.0, 27.0, 25.0, 20.0, 20.0, 18.0, 11.0, 6.0, 4.0, 4.0, 1.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.50390625, -5.347412109375, -5.19091796875, -5.034423828125, -4.8779296875, -4.721435546875, -4.56494140625, -4.408447265625, -4.251953125, -4.095458984375, -3.93896484375, -3.782470703125, -3.6259765625, -3.469482421875, -3.31298828125, -3.156494140625, -3.0, -2.843505859375, -2.68701171875, -2.530517578125, -2.3740234375, -2.217529296875, -2.06103515625, -1.904541015625, -1.748046875, -1.591552734375, -1.43505859375, -1.278564453125, -1.1220703125, -0.965576171875, -0.80908203125, -0.652587890625, -0.49609375, -0.339599609375, -0.18310546875, -0.026611328125, 0.1298828125, 0.286376953125, 0.44287109375, 0.599365234375, 0.755859375, 0.912353515625, 1.06884765625, 1.225341796875, 1.3818359375, 1.538330078125, 1.69482421875, 1.851318359375, 2.0078125, 2.164306640625, 2.32080078125, 2.477294921875, 2.6337890625, 2.790283203125, 2.94677734375, 3.103271484375, 3.259765625, 3.416259765625, 3.57275390625, 3.729248046875, 3.8857421875, 4.042236328125, 4.19873046875, 4.355224609375, 4.51171875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 4.0, 8.0, 10.0, 5.0, 14.0, 17.0, 15.0, 22.0, 21.0, 25.0, 38.0, 33.0, 38.0, 51.0, 35.0, 49.0, 73.0, 154.0, 1685.0, 263.0, 75.0, 48.0, 45.0, 35.0, 37.0, 29.0, 21.0, 27.0, 41.0, 17.0, 16.0, 23.0, 9.0, 11.0, 11.0, 10.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.578125, -18.00927734375, -17.4404296875, -16.87158203125, -16.302734375, -15.73388671875, -15.1650390625, -14.59619140625, -14.02734375, -13.45849609375, -12.8896484375, -12.32080078125, -11.751953125, -11.18310546875, -10.6142578125, -10.04541015625, -9.4765625, -8.90771484375, -8.3388671875, -7.77001953125, -7.201171875, -6.63232421875, -6.0634765625, -5.49462890625, -4.92578125, -4.35693359375, -3.7880859375, -3.21923828125, -2.650390625, -2.08154296875, -1.5126953125, -0.94384765625, -0.375, 0.19384765625, 0.7626953125, 1.33154296875, 1.900390625, 2.46923828125, 3.0380859375, 3.60693359375, 4.17578125, 4.74462890625, 5.3134765625, 5.88232421875, 6.451171875, 7.02001953125, 7.5888671875, 8.15771484375, 8.7265625, 9.29541015625, 9.8642578125, 10.43310546875, 11.001953125, 11.57080078125, 12.1396484375, 12.70849609375, 13.27734375, 13.84619140625, 14.4150390625, 14.98388671875, 15.552734375, 16.12158203125, 16.6904296875, 17.25927734375, 17.828125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 3.0, 6.0, 9.0, 14.0, 21.0, 22.0, 35.0, 34.0, 74.0, 94.0, 120.0, 209.0, 304.0, 584.0, 2475.0, 2533494.0, 604698.0, 2002.0, 559.0, 299.0, 185.0, 140.0, 97.0, 52.0, 42.0, 32.0, 24.0, 20.0, 12.0, 8.0, 7.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.46875, -47.76025390625, -46.0517578125, -44.34326171875, -42.634765625, -40.92626953125, -39.2177734375, -37.50927734375, -35.80078125, -34.09228515625, -32.3837890625, -30.67529296875, -28.966796875, -27.25830078125, -25.5498046875, -23.84130859375, -22.1328125, -20.42431640625, -18.7158203125, -17.00732421875, -15.298828125, -13.59033203125, -11.8818359375, -10.17333984375, -8.46484375, -6.75634765625, -5.0478515625, -3.33935546875, -1.630859375, 0.07763671875, 1.7861328125, 3.49462890625, 5.203125, 6.91162109375, 8.6201171875, 10.32861328125, 12.037109375, 13.74560546875, 15.4541015625, 17.16259765625, 18.87109375, 20.57958984375, 22.2880859375, 23.99658203125, 25.705078125, 27.41357421875, 29.1220703125, 30.83056640625, 32.5390625, 34.24755859375, 35.9560546875, 37.66455078125, 39.373046875, 41.08154296875, 42.7900390625, 44.49853515625, 46.20703125, 47.91552734375, 49.6240234375, 51.33251953125, 53.041015625, 54.74951171875, 56.4580078125, 58.16650390625, 59.875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 3.0, 1004.0, 11.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.21566390991211, -16.800312042236328, -6.38496208190918, 4.030387878417969, 14.44573974609375, 24.86109161376953, 35.27643966674805, 45.69179153442383, 56.10714340209961, 66.52249145507812, 76.9378433227539, 87.35319519042969, 97.76854705810547, 108.18389892578125, 118.5992431640625, 129.0146026611328, 139.42994689941406, 149.8452911376953, 160.26065063476562, 170.67599487304688, 181.0913543701172, 191.50669860839844, 201.92205810546875, 212.33740234375, 222.7527618408203, 233.16810607910156, 243.58346557617188, 253.99880981445312, 264.4141540527344, 274.82952880859375, 285.244873046875, 295.66021728515625, 306.0755920410156, 316.4909362792969, 326.9062805175781, 337.3216552734375, 347.73699951171875, 358.15234375, 368.56768798828125, 378.9830322265625, 389.3984069824219, 399.8137512207031, 410.2290954589844, 420.64447021484375, 431.059814453125, 441.47515869140625, 451.8905029296875, 462.30584716796875, 472.72119140625, 483.13653564453125, 493.5518798828125, 503.9672546386719, 514.382568359375, 524.7979736328125, 535.2133178710938, 545.628662109375, 556.0440063476562, 566.4593505859375, 576.8746948242188, 587.2900390625, 597.7053833007812, 608.1207885742188, 618.5361328125, 628.9514770507812, 639.3668212890625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 4.0, 7.0, 5.0, 6.0, 4.0, 8.0, 17.0, 16.0, 27.0, 21.0, 28.0, 17.0, 28.0, 36.0, 37.0, 45.0, 32.0, 37.0, 37.0, 44.0, 40.0, 42.0, 36.0, 41.0, 46.0, 43.0, 29.0, 35.0, 29.0, 24.0, 29.0, 29.0, 21.0, 18.0, 14.0, 17.0, 6.0, 7.0, 13.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.68431854248047, -48.079673767089844, -46.475032806396484, -44.87038803100586, -43.2657470703125, -41.661102294921875, -40.05645751953125, -38.45181655883789, -36.847171783447266, -35.24252700805664, -33.63788604736328, -32.033241271972656, -30.428598403930664, -28.823955535888672, -27.21931266784668, -25.614669799804688, -24.010026931762695, -22.405384063720703, -20.80074119567871, -19.19609832763672, -17.591453552246094, -15.986810684204102, -14.38216781616211, -12.7775239944458, -11.172881126403809, -9.568238258361816, -7.963594436645508, -6.358951568603516, -4.754308223724365, -3.149664878845215, -1.5450220108032227, 0.05962181091308594, 1.6642646789550781, 3.2689080238342285, 4.873551368713379, 6.478194236755371, 8.08283805847168, 9.687480926513672, 11.292123794555664, 12.896767616271973, 14.501410484313965, 16.106054306030273, 17.710697174072266, 19.315340042114258, 20.91998291015625, 22.524627685546875, 24.129268646240234, 25.73391342163086, 27.33855628967285, 28.943199157714844, 30.547842025756836, 32.15248489379883, 33.75712966918945, 35.36177062988281, 36.96641540527344, 38.57106018066406, 40.17570114135742, 41.78034591674805, 43.384986877441406, 44.98963165283203, 46.59427261352539, 48.198917388916016, 49.803558349609375, 51.408203125, 53.012847900390625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 9.0, 5.0, 5.0, 5.0, 13.0, 8.0, 16.0, 24.0, 22.0, 10.0, 26.0, 20.0, 23.0, 33.0, 37.0, 33.0, 43.0, 43.0, 36.0, 38.0, 45.0, 40.0, 50.0, 47.0, 29.0, 35.0, 41.0, 34.0, 28.0, 26.0, 21.0, 18.0, 23.0, 19.0, 22.0, 10.0, 18.0, 12.0, 10.0, 2.0, 8.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.5234375, -5.3568115234375, -5.190185546875, -5.0235595703125, -4.85693359375, -4.6903076171875, -4.523681640625, -4.3570556640625, -4.1904296875, -4.0238037109375, -3.857177734375, -3.6905517578125, -3.52392578125, -3.3572998046875, -3.190673828125, -3.0240478515625, -2.857421875, -2.6907958984375, -2.524169921875, -2.3575439453125, -2.19091796875, -2.0242919921875, -1.857666015625, -1.6910400390625, -1.5244140625, -1.3577880859375, -1.191162109375, -1.0245361328125, -0.85791015625, -0.6912841796875, -0.524658203125, -0.3580322265625, -0.19140625, -0.0247802734375, 0.141845703125, 0.3084716796875, 0.47509765625, 0.6417236328125, 0.808349609375, 0.9749755859375, 1.1416015625, 1.3082275390625, 1.474853515625, 1.6414794921875, 1.80810546875, 1.9747314453125, 2.141357421875, 2.3079833984375, 2.474609375, 2.6412353515625, 2.807861328125, 2.9744873046875, 3.14111328125, 3.3077392578125, 3.474365234375, 3.6409912109375, 3.8076171875, 3.9742431640625, 4.140869140625, 4.3074951171875, 4.47412109375, 4.6407470703125, 4.807373046875, 4.9739990234375, 5.140625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 4.0, 5.0, 14.0, 8.0, 19.0, 19.0, 22.0, 25.0, 22.0, 35.0, 43.0, 46.0, 58.0, 81.0, 101.0, 158.0, 237.0, 443.0, 1048.0, 3939.0, 21826.0, 259746.0, 2247692.0, 1522723.0, 118231.0, 12930.0, 2739.0, 878.0, 354.0, 197.0, 129.0, 95.0, 73.0, 59.0, 43.0, 46.0, 24.0, 39.0, 31.0, 23.0, 16.0, 10.0, 10.0, 6.0, 8.0, 7.0, 1.0, 6.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-12.7265625, -12.3271484375, -11.927734375, -11.5283203125, -11.12890625, -10.7294921875, -10.330078125, -9.9306640625, -9.53125, -9.1318359375, -8.732421875, -8.3330078125, -7.93359375, -7.5341796875, -7.134765625, -6.7353515625, -6.3359375, -5.9365234375, -5.537109375, -5.1376953125, -4.73828125, -4.3388671875, -3.939453125, -3.5400390625, -3.140625, -2.7412109375, -2.341796875, -1.9423828125, -1.54296875, -1.1435546875, -0.744140625, -0.3447265625, 0.0546875, 0.4541015625, 0.853515625, 1.2529296875, 1.65234375, 2.0517578125, 2.451171875, 2.8505859375, 3.25, 3.6494140625, 4.048828125, 4.4482421875, 4.84765625, 5.2470703125, 5.646484375, 6.0458984375, 6.4453125, 6.8447265625, 7.244140625, 7.6435546875, 8.04296875, 8.4423828125, 8.841796875, 9.2412109375, 9.640625, 10.0400390625, 10.439453125, 10.8388671875, 11.23828125, 11.6376953125, 12.037109375, 12.4365234375, 12.8359375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 8.0, 12.0, 12.0, 23.0, 31.0, 34.0, 51.0, 53.0, 96.0, 126.0, 178.0, 247.0, 345.0, 449.0, 495.0, 438.0, 393.0, 313.0, 177.0, 154.0, 134.0, 57.0, 69.0, 46.0, 30.0, 24.0, 20.0, 13.0, 7.0, 10.0, 7.0, 9.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.231689453125, -7.88525390625, -7.538818359375, -7.1923828125, -6.845947265625, -6.49951171875, -6.153076171875, -5.806640625, -5.460205078125, -5.11376953125, -4.767333984375, -4.4208984375, -4.074462890625, -3.72802734375, -3.381591796875, -3.03515625, -2.688720703125, -2.34228515625, -1.995849609375, -1.6494140625, -1.302978515625, -0.95654296875, -0.610107421875, -0.263671875, 0.082763671875, 0.42919921875, 0.775634765625, 1.1220703125, 1.468505859375, 1.81494140625, 2.161376953125, 2.5078125, 2.854248046875, 3.20068359375, 3.547119140625, 3.8935546875, 4.239990234375, 4.58642578125, 4.932861328125, 5.279296875, 5.625732421875, 5.97216796875, 6.318603515625, 6.6650390625, 7.011474609375, 7.35791015625, 7.704345703125, 8.05078125, 8.397216796875, 8.74365234375, 9.090087890625, 9.4365234375, 9.782958984375, 10.12939453125, 10.475830078125, 10.822265625, 11.168701171875, 11.51513671875, 11.861572265625, 12.2080078125, 12.554443359375, 12.90087890625, 13.247314453125, 13.59375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 6.0, 14.0, 13.0, 18.0, 17.0, 25.0, 36.0, 44.0, 61.0, 93.0, 114.0, 149.0, 199.0, 244.0, 342.0, 596.0, 6030.0, 3808409.0, 374606.0, 1519.0, 496.0, 333.0, 209.0, 163.0, 156.0, 82.0, 81.0, 46.0, 57.0, 30.0, 22.0, 26.0, 18.0, 11.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-61.71875, -60.0419921875, -58.365234375, -56.6884765625, -55.01171875, -53.3349609375, -51.658203125, -49.9814453125, -48.3046875, -46.6279296875, -44.951171875, -43.2744140625, -41.59765625, -39.9208984375, -38.244140625, -36.5673828125, -34.890625, -33.2138671875, -31.537109375, -29.8603515625, -28.18359375, -26.5068359375, -24.830078125, -23.1533203125, -21.4765625, -19.7998046875, -18.123046875, -16.4462890625, -14.76953125, -13.0927734375, -11.416015625, -9.7392578125, -8.0625, -6.3857421875, -4.708984375, -3.0322265625, -1.35546875, 0.3212890625, 1.998046875, 3.6748046875, 5.3515625, 7.0283203125, 8.705078125, 10.3818359375, 12.05859375, 13.7353515625, 15.412109375, 17.0888671875, 18.765625, 20.4423828125, 22.119140625, 23.7958984375, 25.47265625, 27.1494140625, 28.826171875, 30.5029296875, 32.1796875, 33.8564453125, 35.533203125, 37.2099609375, 38.88671875, 40.5634765625, 42.240234375, 43.9169921875, 45.59375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 19.0, 125.0, 527.0, 316.0, 30.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.33722686767578, -102.78571319580078, -96.23420715332031, -89.68269348144531, -83.13117980957031, -76.57967376708984, -70.02816009521484, -63.47665023803711, -56.925140380859375, -50.37363052368164, -43.822120666503906, -37.270606994628906, -30.719097137451172, -24.167587280273438, -17.616073608398438, -11.064563751220703, -4.513053894042969, 2.038456916809082, 8.589967727661133, 15.1414794921875, 21.692989349365234, 28.24449920654297, 34.79601287841797, 41.3475227355957, 47.89903259277344, 54.45054244995117, 61.002052307128906, 67.5535659790039, 74.10507202148438, 80.65658569335938, 87.20809936523438, 93.75961303710938, 100.31112670898438, 106.86264038085938, 113.41414642333984, 119.96566009521484, 126.51716613769531, 133.0686798095703, 139.6201934814453, 146.1717071533203, 152.72320556640625, 159.27471923828125, 165.82623291015625, 172.37774658203125, 178.9292449951172, 185.4807586669922, 192.0322723388672, 198.5837860107422, 205.1352996826172, 211.6868133544922, 218.2383270263672, 224.78982543945312, 231.34133911132812, 237.89285278320312, 244.44436645507812, 250.99588012695312, 257.5473937988281, 264.0989074707031, 270.6504211425781, 277.2019348144531, 283.7534484863281, 290.304931640625, 296.8564453125, 303.407958984375, 309.95947265625]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 6.0, 11.0, 6.0, 16.0, 9.0, 13.0, 26.0, 14.0, 21.0, 24.0, 22.0, 23.0, 24.0, 34.0, 27.0, 39.0, 36.0, 36.0, 52.0, 56.0, 46.0, 38.0, 35.0, 45.0, 35.0, 38.0, 36.0, 24.0, 20.0, 30.0, 28.0, 25.0, 15.0, 12.0, 17.0, 14.0, 11.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-37.34490966796875, -36.23625946044922, -35.12760925292969, -34.018959045410156, -32.910308837890625, -31.80165672302246, -30.693004608154297, -29.584354400634766, -28.475704193115234, -27.367053985595703, -26.258403778076172, -25.149751663208008, -24.041101455688477, -22.932451248168945, -21.82379913330078, -20.71514892578125, -19.60649871826172, -18.497848510742188, -17.389198303222656, -16.280546188354492, -15.171895980834961, -14.06324577331543, -12.954594612121582, -11.845943450927734, -10.737293243408203, -9.628643035888672, -8.519991874694824, -7.411341190338135, -6.302690505981445, -5.194039821624756, -4.085389137268066, -2.976738452911377, -1.8680877685546875, -0.759437084197998, 0.3492136001586914, 1.4578642845153809, 2.5665149688720703, 3.6751656532287598, 4.783816337585449, 5.892467021942139, 7.001117706298828, 8.10976791381836, 9.218419075012207, 10.327070236206055, 11.435720443725586, 12.544370651245117, 13.653021812438965, 14.761672973632812, 15.870323181152344, 16.978973388671875, 18.087623596191406, 19.19627571105957, 20.3049259185791, 21.413576126098633, 22.522228240966797, 23.630878448486328, 24.73952865600586, 25.84817886352539, 26.956829071044922, 28.065481185913086, 29.174131393432617, 30.28278160095215, 31.391433715820312, 32.500083923339844, 33.608734130859375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 10.0, 6.0, 12.0, 22.0, 10.0, 15.0, 21.0, 25.0, 23.0, 18.0, 26.0, 32.0, 23.0, 29.0, 30.0, 32.0, 42.0, 40.0, 38.0, 34.0, 31.0, 43.0, 43.0, 40.0, 27.0, 16.0, 32.0, 41.0, 18.0, 26.0, 27.0, 26.0, 18.0, 15.0, 16.0, 13.0, 10.0, 9.0, 10.0, 13.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.671875, -4.526611328125, -4.38134765625, -4.236083984375, -4.0908203125, -3.945556640625, -3.80029296875, -3.655029296875, -3.509765625, -3.364501953125, -3.21923828125, -3.073974609375, -2.9287109375, -2.783447265625, -2.63818359375, -2.492919921875, -2.34765625, -2.202392578125, -2.05712890625, -1.911865234375, -1.7666015625, -1.621337890625, -1.47607421875, -1.330810546875, -1.185546875, -1.040283203125, -0.89501953125, -0.749755859375, -0.6044921875, -0.459228515625, -0.31396484375, -0.168701171875, -0.0234375, 0.121826171875, 0.26708984375, 0.412353515625, 0.5576171875, 0.702880859375, 0.84814453125, 0.993408203125, 1.138671875, 1.283935546875, 1.42919921875, 1.574462890625, 1.7197265625, 1.864990234375, 2.01025390625, 2.155517578125, 2.30078125, 2.446044921875, 2.59130859375, 2.736572265625, 2.8818359375, 3.027099609375, 3.17236328125, 3.317626953125, 3.462890625, 3.608154296875, 3.75341796875, 3.898681640625, 4.0439453125, 4.189208984375, 4.33447265625, 4.479736328125, 4.625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 4.0, 12.0, 17.0, 29.0, 40.0, 54.0, 86.0, 122.0, 194.0, 265.0, 437.0, 562.0, 895.0, 1354.0, 2100.0, 2997.0, 4568.0, 6866.0, 10777.0, 16516.0, 26236.0, 42613.0, 73164.0, 129326.0, 210061.0, 207301.0, 126241.0, 70735.0, 41969.0, 25780.0, 16534.0, 10366.0, 6884.0, 4438.0, 2972.0, 2016.0, 1304.0, 897.0, 586.0, 423.0, 266.0, 167.0, 129.0, 82.0, 63.0, 37.0, 25.0, 14.0, 13.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.68115234375, -0.6591644287109375, -0.637176513671875, -0.6151885986328125, -0.59320068359375, -0.5712127685546875, -0.549224853515625, -0.5272369384765625, -0.5052490234375, -0.4832611083984375, -0.461273193359375, -0.4392852783203125, -0.41729736328125, -0.3953094482421875, -0.373321533203125, -0.3513336181640625, -0.329345703125, -0.3073577880859375, -0.285369873046875, -0.2633819580078125, -0.24139404296875, -0.2194061279296875, -0.197418212890625, -0.1754302978515625, -0.1534423828125, -0.1314544677734375, -0.109466552734375, -0.0874786376953125, -0.06549072265625, -0.0435028076171875, -0.021514892578125, 0.0004730224609375, 0.0224609375, 0.0444488525390625, 0.066436767578125, 0.0884246826171875, 0.11041259765625, 0.1324005126953125, 0.154388427734375, 0.1763763427734375, 0.1983642578125, 0.2203521728515625, 0.242340087890625, 0.2643280029296875, 0.28631591796875, 0.3083038330078125, 0.330291748046875, 0.3522796630859375, 0.374267578125, 0.3962554931640625, 0.418243408203125, 0.4402313232421875, 0.46221923828125, 0.4842071533203125, 0.506195068359375, 0.5281829833984375, 0.5501708984375, 0.5721588134765625, 0.594146728515625, 0.6161346435546875, 0.63812255859375, 0.6601104736328125, 0.682098388671875, 0.7040863037109375, 0.72607421875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 3.0, 4.0, 11.0, 11.0, 3.0, 12.0, 8.0, 16.0, 17.0, 25.0, 24.0, 27.0, 41.0, 24.0, 34.0, 37.0, 51.0, 35.0, 51.0, 38.0, 47.0, 1066.0, 45.0, 36.0, 46.0, 42.0, 30.0, 29.0, 29.0, 29.0, 19.0, 19.0, 24.0, 17.0, 19.0, 11.0, 10.0, 7.0, 2.0, 7.0, 6.0, 8.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.198974609375, -3.08544921875, -2.971923828125, -2.8583984375, -2.744873046875, -2.63134765625, -2.517822265625, -2.404296875, -2.290771484375, -2.17724609375, -2.063720703125, -1.9501953125, -1.836669921875, -1.72314453125, -1.609619140625, -1.49609375, -1.382568359375, -1.26904296875, -1.155517578125, -1.0419921875, -0.928466796875, -0.81494140625, -0.701416015625, -0.587890625, -0.474365234375, -0.36083984375, -0.247314453125, -0.1337890625, -0.020263671875, 0.09326171875, 0.206787109375, 0.3203125, 0.433837890625, 0.54736328125, 0.660888671875, 0.7744140625, 0.887939453125, 1.00146484375, 1.114990234375, 1.228515625, 1.342041015625, 1.45556640625, 1.569091796875, 1.6826171875, 1.796142578125, 1.90966796875, 2.023193359375, 2.13671875, 2.250244140625, 2.36376953125, 2.477294921875, 2.5908203125, 2.704345703125, 2.81787109375, 2.931396484375, 3.044921875, 3.158447265625, 3.27197265625, 3.385498046875, 3.4990234375, 3.612548828125, 3.72607421875, 3.839599609375, 3.953125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 14.0, 24.0, 26.0, 36.0, 49.0, 85.0, 146.0, 221.0, 298.0, 519.0, 837.0, 1309.0, 2011.0, 3260.0, 5034.0, 8227.0, 13573.0, 21872.0, 36436.0, 60063.0, 101874.0, 166994.0, 1259746.0, 163842.0, 99929.0, 59143.0, 35438.0, 21571.0, 12990.0, 7913.0, 4995.0, 3178.0, 1939.0, 1259.0, 765.0, 537.0, 345.0, 233.0, 127.0, 97.0, 57.0, 39.0, 25.0, 15.0, 14.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.5380859375, -0.52099609375, -0.50390625, -0.48681640625, -0.4697265625, -0.45263671875, -0.435546875, -0.41845703125, -0.4013671875, -0.38427734375, -0.3671875, -0.35009765625, -0.3330078125, -0.31591796875, -0.298828125, -0.28173828125, -0.2646484375, -0.24755859375, -0.23046875, -0.21337890625, -0.1962890625, -0.17919921875, -0.162109375, -0.14501953125, -0.1279296875, -0.11083984375, -0.09375, -0.07666015625, -0.0595703125, -0.04248046875, -0.025390625, -0.00830078125, 0.0087890625, 0.02587890625, 0.04296875, 0.06005859375, 0.0771484375, 0.09423828125, 0.111328125, 0.12841796875, 0.1455078125, 0.16259765625, 0.1796875, 0.19677734375, 0.2138671875, 0.23095703125, 0.248046875, 0.26513671875, 0.2822265625, 0.29931640625, 0.31640625, 0.33349609375, 0.3505859375, 0.36767578125, 0.384765625, 0.40185546875, 0.4189453125, 0.43603515625, 0.453125, 0.47021484375, 0.4873046875, 0.50439453125, 0.521484375, 0.53857421875, 0.5556640625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 2.0, 10.0, 11.0, 16.0, 28.0, 31.0, 51.0, 61.0, 68.0, 74.0, 115.0, 118.0, 94.0, 81.0, 62.0, 52.0, 42.0, 26.0, 17.0, 11.0, 8.0, 5.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.00383758544921875, -0.0037343502044677734, -0.003631114959716797, -0.0035278797149658203, -0.0034246444702148438, -0.003321409225463867, -0.0032181739807128906, -0.003114938735961914, -0.0030117034912109375, -0.002908468246459961, -0.0028052330017089844, -0.002701997756958008, -0.0025987625122070312, -0.0024955272674560547, -0.002392292022705078, -0.0022890567779541016, -0.002185821533203125, -0.0020825862884521484, -0.001979351043701172, -0.0018761157989501953, -0.0017728805541992188, -0.0016696453094482422, -0.0015664100646972656, -0.001463174819946289, -0.0013599395751953125, -0.001256704330444336, -0.0011534690856933594, -0.0010502338409423828, -0.0009469985961914062, -0.0008437633514404297, -0.0007405281066894531, -0.0006372928619384766, -0.0005340576171875, -0.00043082237243652344, -0.0003275871276855469, -0.0002243518829345703, -0.00012111663818359375, -1.7881393432617188e-05, 8.535385131835938e-05, 0.00018858909606933594, 0.0002918243408203125, 0.00039505958557128906, 0.0004982948303222656, 0.0006015300750732422, 0.0007047653198242188, 0.0008080005645751953, 0.0009112358093261719, 0.0010144710540771484, 0.001117706298828125, 0.0012209415435791016, 0.0013241767883300781, 0.0014274120330810547, 0.0015306472778320312, 0.0016338825225830078, 0.0017371177673339844, 0.001840353012084961, 0.0019435882568359375, 0.002046823501586914, 0.0021500587463378906, 0.002253293991088867, 0.0023565292358398438, 0.0024597644805908203, 0.002562999725341797, 0.0026662349700927734, 0.00276947021484375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 13.0, 10.0, 18.0, 28.0, 26.0, 27.0, 79.0, 88.0, 105.0, 237.0, 747.0, 131584.0, 913597.0, 1223.0, 260.0, 166.0, 102.0, 51.0, 36.0, 39.0, 34.0, 16.0, 10.0, 12.0, 10.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053619384765625, -0.05156564712524414, -0.04951190948486328, -0.04745817184448242, -0.04540443420410156, -0.0433506965637207, -0.041296958923339844, -0.039243221282958984, -0.037189483642578125, -0.035135746002197266, -0.033082008361816406, -0.031028270721435547, -0.028974533081054688, -0.026920795440673828, -0.02486705780029297, -0.02281332015991211, -0.02075958251953125, -0.01870584487915039, -0.01665210723876953, -0.014598369598388672, -0.012544631958007812, -0.010490894317626953, -0.008437156677246094, -0.006383419036865234, -0.004329681396484375, -0.0022759437561035156, -0.00022220611572265625, 0.0018315315246582031, 0.0038852691650390625, 0.005939006805419922, 0.007992744445800781, 0.01004648208618164, 0.0121002197265625, 0.01415395736694336, 0.01620769500732422, 0.018261432647705078, 0.020315170288085938, 0.022368907928466797, 0.024422645568847656, 0.026476383209228516, 0.028530120849609375, 0.030583858489990234, 0.032637596130371094, 0.03469133377075195, 0.03674507141113281, 0.03879880905151367, 0.04085254669189453, 0.04290628433227539, 0.04496002197265625, 0.04701375961303711, 0.04906749725341797, 0.05112123489379883, 0.05317497253417969, 0.05522871017456055, 0.057282447814941406, 0.059336185455322266, 0.061389923095703125, 0.06344366073608398, 0.06549739837646484, 0.0675511360168457, 0.06960487365722656, 0.07165861129760742, 0.07371234893798828, 0.07576608657836914, 0.07781982421875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 17.0, 76.0, 247.0, 429.0, 196.0, 38.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020997445099055767, -0.001942525035701692, -0.0017853055614978075, -0.001628085970878601, -0.0014708664966747165, -0.0013136470224708319, -0.0011564274318516254, -0.0009992079576477408, -0.0008419884834438562, -0.0006847690092399716, -0.0005275494768284261, -0.00037032997352071106, -0.000213110470212996, -5.5890996009111404e-05, 0.00010132853640243411, 0.0002585480688139796, 0.00041576754301786423, 0.0005729870172217488, 0.0007302065496332943, 0.0008874260820448399, 0.0010446455562487245, 0.001201865030452609, 0.0013590846210718155, 0.0015163040952757, 0.0016735235694795847, 0.0018307430436834693, 0.001987962517887354, 0.0021451821085065603, 0.0023024016991257668, 0.0024596210569143295, 0.002616840647533536, 0.0027740602381527424, 0.002931279130280018, 0.0030884987208992243, 0.003245718078687787, 0.0034029376693069935, 0.0035601570270955563, 0.0037173766177147627, 0.003874596208333969, 0.004031815566122532, 0.004189034923911095, 0.0043462542816996574, 0.0045034741051495075, 0.00466069346293807, 0.004817912820726633, 0.004975132644176483, 0.005132352001965046, 0.005289571359753609, 0.005446791183203459, 0.0056040105409920216, 0.005761230364441872, 0.005918449722230434, 0.006075669080018997, 0.00623288843780756, 0.00639010826125741, 0.006547327619045973, 0.006704547442495823, 0.006861766800284386, 0.007018986623734236, 0.0071762059815227985, 0.007333425339311361, 0.007490645162761211, 0.007647864520549774, 0.007805083878338337, 0.0079623032361269]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 9.0, 5.0, 4.0, 3.0, 3.0, 7.0, 8.0, 8.0, 18.0, 13.0, 15.0, 25.0, 26.0, 28.0, 26.0, 27.0, 34.0, 35.0, 34.0, 41.0, 40.0, 38.0, 58.0, 36.0, 37.0, 61.0, 46.0, 27.0, 49.0, 34.0, 32.0, 32.0, 25.0, 21.0, 19.0, 14.0, 15.0, 6.0, 10.0, 7.0, 3.0, 7.0, 3.0, 8.0, 12.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0012882351875305176, -0.0012522926554083824, -0.0012163501232862473, -0.001180407591164112, -0.001144465059041977, -0.0011085225269198418, -0.0010725799947977066, -0.0010366374626755714, -0.0010006949305534363, -0.0009647523984313011, -0.000928809866309166, -0.0008928673341870308, -0.0008569248020648956, -0.0008209822699427605, -0.0007850397378206253, -0.0007490972056984901, -0.000713154673576355, -0.0006772121414542198, -0.0006412696093320847, -0.0006053270772099495, -0.0005693845450878143, -0.0005334420129656792, -0.000497499480843544, -0.00046155694872140884, -0.0004256144165992737, -0.0003896718844771385, -0.00035372935235500336, -0.0003177868202328682, -0.00028184428811073303, -0.00024590175598859787, -0.0002099592238664627, -0.00017401669174432755, -0.00013807415962219238, -0.00010213162750005722, -6.618909537792206e-05, -3.0246563255786896e-05, 5.695968866348267e-06, 4.163850098848343e-05, 7.758103311061859e-05, 0.00011352356523275375, 0.00014946609735488892, 0.00018540862947702408, 0.00022135116159915924, 0.0002572936937212944, 0.00029323622584342957, 0.00032917875796556473, 0.0003651212900876999, 0.00040106382220983505, 0.0004370063543319702, 0.0004729488864541054, 0.0005088914185762405, 0.0005448339506983757, 0.0005807764828205109, 0.000616719014942646, 0.0006526615470647812, 0.0006886040791869164, 0.0007245466113090515, 0.0007604891434311867, 0.0007964316755533218, 0.000832374207675457, 0.0008683167397975922, 0.0009042592719197273, 0.0009402018040418625, 0.0009761443361639977, 0.0010120868682861328]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 5.0, 9.0, 6.0, 12.0, 22.0, 10.0, 15.0, 21.0, 25.0, 23.0, 18.0, 27.0, 31.0, 23.0, 29.0, 30.0, 32.0, 42.0, 40.0, 38.0, 34.0, 31.0, 43.0, 43.0, 40.0, 27.0, 16.0, 32.0, 41.0, 18.0, 26.0, 27.0, 26.0, 18.0, 15.0, 16.0, 13.0, 10.0, 9.0, 10.0, 13.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.671875, -4.526611328125, -4.38134765625, -4.236083984375, -4.0908203125, -3.945556640625, -3.80029296875, -3.655029296875, -3.509765625, -3.364501953125, -3.21923828125, -3.073974609375, -2.9287109375, -2.783447265625, -2.63818359375, -2.492919921875, -2.34765625, -2.202392578125, -2.05712890625, -1.911865234375, -1.7666015625, -1.621337890625, -1.47607421875, -1.330810546875, -1.185546875, -1.040283203125, -0.89501953125, -0.749755859375, -0.6044921875, -0.459228515625, -0.31396484375, -0.168701171875, -0.0234375, 0.121826171875, 0.26708984375, 0.412353515625, 0.5576171875, 0.702880859375, 0.84814453125, 0.993408203125, 1.138671875, 1.283935546875, 1.42919921875, 1.574462890625, 1.7197265625, 1.864990234375, 2.01025390625, 2.155517578125, 2.30078125, 2.446044921875, 2.59130859375, 2.736572265625, 2.8818359375, 3.027099609375, 3.17236328125, 3.317626953125, 3.462890625, 3.608154296875, 3.75341796875, 3.898681640625, 4.0439453125, 4.189208984375, 4.33447265625, 4.479736328125, 4.625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 2.0, 3.0, 0.0, 5.0, 6.0, 10.0, 10.0, 12.0, 19.0, 24.0, 30.0, 43.0, 76.0, 118.0, 234.0, 391.0, 717.0, 1266.0, 2344.0, 4497.0, 8878.0, 17892.0, 39031.0, 91389.0, 229988.0, 372269.0, 158668.0, 64371.0, 28452.0, 13532.0, 6610.0, 3503.0, 1777.0, 996.0, 532.0, 342.0, 191.0, 110.0, 64.0, 48.0, 23.0, 20.0, 17.0, 9.0, 6.0, 7.0, 7.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0], "bins": [-3.458984375, -3.351898193359375, -3.24481201171875, -3.137725830078125, -3.0306396484375, -2.923553466796875, -2.81646728515625, -2.709381103515625, -2.602294921875, -2.495208740234375, -2.38812255859375, -2.281036376953125, -2.1739501953125, -2.066864013671875, -1.95977783203125, -1.852691650390625, -1.74560546875, -1.638519287109375, -1.53143310546875, -1.424346923828125, -1.3172607421875, -1.210174560546875, -1.10308837890625, -0.996002197265625, -0.888916015625, -0.781829833984375, -0.67474365234375, -0.567657470703125, -0.4605712890625, -0.353485107421875, -0.24639892578125, -0.139312744140625, -0.0322265625, 0.074859619140625, 0.18194580078125, 0.289031982421875, 0.3961181640625, 0.503204345703125, 0.61029052734375, 0.717376708984375, 0.824462890625, 0.931549072265625, 1.03863525390625, 1.145721435546875, 1.2528076171875, 1.359893798828125, 1.46697998046875, 1.574066162109375, 1.68115234375, 1.788238525390625, 1.89532470703125, 2.002410888671875, 2.1094970703125, 2.216583251953125, 2.32366943359375, 2.430755615234375, 2.537841796875, 2.644927978515625, 2.75201416015625, 2.859100341796875, 2.9661865234375, 3.073272705078125, 3.18035888671875, 3.287445068359375, 3.39453125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 8.0, 13.0, 3.0, 27.0, 19.0, 14.0, 13.0, 23.0, 35.0, 26.0, 38.0, 46.0, 50.0, 51.0, 87.0, 164.0, 1587.0, 300.0, 92.0, 59.0, 64.0, 49.0, 45.0, 25.0, 33.0, 26.0, 23.0, 31.0, 21.0, 12.0, 10.0, 7.0, 7.0, 7.0, 3.0, 4.0, 6.0, 5.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.984375, -17.417236328125, -16.85009765625, -16.282958984375, -15.7158203125, -15.148681640625, -14.58154296875, -14.014404296875, -13.447265625, -12.880126953125, -12.31298828125, -11.745849609375, -11.1787109375, -10.611572265625, -10.04443359375, -9.477294921875, -8.91015625, -8.343017578125, -7.77587890625, -7.208740234375, -6.6416015625, -6.074462890625, -5.50732421875, -4.940185546875, -4.373046875, -3.805908203125, -3.23876953125, -2.671630859375, -2.1044921875, -1.537353515625, -0.97021484375, -0.403076171875, 0.1640625, 0.731201171875, 1.29833984375, 1.865478515625, 2.4326171875, 2.999755859375, 3.56689453125, 4.134033203125, 4.701171875, 5.268310546875, 5.83544921875, 6.402587890625, 6.9697265625, 7.536865234375, 8.10400390625, 8.671142578125, 9.23828125, 9.805419921875, 10.37255859375, 10.939697265625, 11.5068359375, 12.073974609375, 12.64111328125, 13.208251953125, 13.775390625, 14.342529296875, 14.90966796875, 15.476806640625, 16.0439453125, 16.611083984375, 17.17822265625, 17.745361328125, 18.3125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 0.0, 4.0, 6.0, 6.0, 6.0, 6.0, 9.0, 9.0, 11.0, 19.0, 29.0, 37.0, 48.0, 58.0, 64.0, 72.0, 123.0, 148.0, 237.0, 341.0, 680.0, 3343.0, 2052661.0, 1082959.0, 3023.0, 625.0, 326.0, 233.0, 139.0, 131.0, 99.0, 56.0, 40.0, 22.0, 23.0, 33.0, 21.0, 8.0, 21.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.21875, -42.8779296875, -41.537109375, -40.1962890625, -38.85546875, -37.5146484375, -36.173828125, -34.8330078125, -33.4921875, -32.1513671875, -30.810546875, -29.4697265625, -28.12890625, -26.7880859375, -25.447265625, -24.1064453125, -22.765625, -21.4248046875, -20.083984375, -18.7431640625, -17.40234375, -16.0615234375, -14.720703125, -13.3798828125, -12.0390625, -10.6982421875, -9.357421875, -8.0166015625, -6.67578125, -5.3349609375, -3.994140625, -2.6533203125, -1.3125, 0.0283203125, 1.369140625, 2.7099609375, 4.05078125, 5.3916015625, 6.732421875, 8.0732421875, 9.4140625, 10.7548828125, 12.095703125, 13.4365234375, 14.77734375, 16.1181640625, 17.458984375, 18.7998046875, 20.140625, 21.4814453125, 22.822265625, 24.1630859375, 25.50390625, 26.8447265625, 28.185546875, 29.5263671875, 30.8671875, 32.2080078125, 33.548828125, 34.8896484375, 36.23046875, 37.5712890625, 38.912109375, 40.2529296875, 41.59375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 139.0, 506.0, 322.0, 38.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.318716049194336, -15.096857070922852, -12.874998092651367, -10.653138160705566, -8.431279182434082, -6.209420204162598, -3.987560272216797, -1.7657012939453125, 0.4561576843261719, 2.6780169010162354, 4.899876117706299, 7.121735572814941, 9.343594551086426, 11.56545352935791, 13.787313461303711, 16.009172439575195, 18.23103141784668, 20.452890396118164, 22.67474937438965, 24.896610260009766, 27.11846923828125, 29.340328216552734, 31.56218719482422, 33.7840461730957, 36.00590515136719, 38.22776412963867, 40.449623107910156, 42.67148208618164, 44.893341064453125, 47.11520004272461, 49.337059020996094, 51.558921813964844, 53.78077697753906, 56.00263595581055, 58.22449493408203, 60.446353912353516, 62.668212890625, 64.89007568359375, 67.11193084716797, 69.33379364013672, 71.55564880371094, 73.77751159667969, 75.9993667602539, 78.22122955322266, 80.44308471679688, 82.66494750976562, 84.88680267333984, 87.1086654663086, 89.33052062988281, 91.55238342285156, 93.77423858642578, 95.99610137939453, 98.21795654296875, 100.4398193359375, 102.66167449951172, 104.88353729248047, 107.10540008544922, 109.32726287841797, 111.54911804199219, 113.77098083496094, 115.99283599853516, 118.2146987915039, 120.43655395507812, 122.65841674804688, 124.8802719116211]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 6.0, 8.0, 6.0, 8.0, 12.0, 9.0, 12.0, 10.0, 22.0, 25.0, 33.0, 26.0, 33.0, 20.0, 24.0, 36.0, 35.0, 42.0, 38.0, 32.0, 35.0, 26.0, 30.0, 39.0, 32.0, 43.0, 38.0, 29.0, 28.0, 21.0, 23.0, 23.0, 31.0, 10.0, 20.0, 21.0, 18.0, 14.0, 15.0, 14.0, 11.0, 6.0, 7.0, 6.0, 3.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-38.85610580444336, -37.63048553466797, -36.40486145019531, -35.17924118041992, -33.95362091064453, -32.72800064086914, -31.502378463745117, -30.276756286621094, -29.051136016845703, -27.825515747070312, -26.59989356994629, -25.374271392822266, -24.148651123046875, -22.923030853271484, -21.69740867614746, -20.471786499023438, -19.246166229248047, -18.020545959472656, -16.794923782348633, -15.569302558898926, -14.343681335449219, -13.118060111999512, -11.892438888549805, -10.666817665100098, -9.44119644165039, -8.215575218200684, -6.989953994750977, -5.7643327713012695, -4.5387115478515625, -3.3130903244018555, -2.0874691009521484, -0.8618478775024414, 0.36377716064453125, 1.5893983840942383, 2.8150196075439453, 4.040640830993652, 5.266262054443359, 6.491883277893066, 7.717504501342773, 8.94312572479248, 10.168746948242188, 11.394368171691895, 12.619989395141602, 13.845610618591309, 15.071231842041016, 16.296852111816406, 17.52247428894043, 18.748096466064453, 19.973716735839844, 21.199337005615234, 22.424959182739258, 23.65058135986328, 24.876201629638672, 26.101821899414062, 27.327444076538086, 28.55306625366211, 29.7786865234375, 31.00430679321289, 32.22992706298828, 33.45555114746094, 34.68117141723633, 35.90679168701172, 37.132415771484375, 38.358036041259766, 39.583656311035156]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 4.0, 9.0, 14.0, 10.0, 9.0, 14.0, 14.0, 19.0, 35.0, 23.0, 28.0, 19.0, 25.0, 33.0, 38.0, 41.0, 24.0, 37.0, 33.0, 40.0, 46.0, 34.0, 44.0, 31.0, 34.0, 24.0, 24.0, 37.0, 25.0, 34.0, 14.0, 29.0, 24.0, 24.0, 12.0, 10.0, 8.0, 17.0, 11.0, 14.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.8828125, -4.72821044921875, -4.5736083984375, -4.41900634765625, -4.264404296875, -4.10980224609375, -3.9552001953125, -3.80059814453125, -3.64599609375, -3.49139404296875, -3.3367919921875, -3.18218994140625, -3.027587890625, -2.87298583984375, -2.7183837890625, -2.56378173828125, -2.4091796875, -2.25457763671875, -2.0999755859375, -1.94537353515625, -1.790771484375, -1.63616943359375, -1.4815673828125, -1.32696533203125, -1.17236328125, -1.01776123046875, -0.8631591796875, -0.70855712890625, -0.553955078125, -0.39935302734375, -0.2447509765625, -0.09014892578125, 0.064453125, 0.21905517578125, 0.3736572265625, 0.52825927734375, 0.682861328125, 0.83746337890625, 0.9920654296875, 1.14666748046875, 1.30126953125, 1.45587158203125, 1.6104736328125, 1.76507568359375, 1.919677734375, 2.07427978515625, 2.2288818359375, 2.38348388671875, 2.5380859375, 2.69268798828125, 2.8472900390625, 3.00189208984375, 3.156494140625, 3.31109619140625, 3.4656982421875, 3.62030029296875, 3.77490234375, 3.92950439453125, 4.0841064453125, 4.23870849609375, 4.393310546875, 4.54791259765625, 4.7025146484375, 4.85711669921875, 5.01171875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 7.0, 7.0, 9.0, 12.0, 13.0, 12.0, 11.0, 19.0, 22.0, 26.0, 31.0, 38.0, 46.0, 61.0, 133.0, 294.0, 543.0, 1902.0, 9547.0, 128996.0, 2484533.0, 1501858.0, 57332.0, 6230.0, 1378.0, 510.0, 260.0, 120.0, 61.0, 43.0, 36.0, 27.0, 14.0, 25.0, 18.0, 17.0, 12.0, 17.0, 14.0, 6.0, 7.0, 9.0, 6.0, 5.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.9453125, -15.4288330078125, -14.912353515625, -14.3958740234375, -13.87939453125, -13.3629150390625, -12.846435546875, -12.3299560546875, -11.8134765625, -11.2969970703125, -10.780517578125, -10.2640380859375, -9.74755859375, -9.2310791015625, -8.714599609375, -8.1981201171875, -7.681640625, -7.1651611328125, -6.648681640625, -6.1322021484375, -5.61572265625, -5.0992431640625, -4.582763671875, -4.0662841796875, -3.5498046875, -3.0333251953125, -2.516845703125, -2.0003662109375, -1.48388671875, -0.9674072265625, -0.450927734375, 0.0655517578125, 0.58203125, 1.0985107421875, 1.614990234375, 2.1314697265625, 2.64794921875, 3.1644287109375, 3.680908203125, 4.1973876953125, 4.7138671875, 5.2303466796875, 5.746826171875, 6.2633056640625, 6.77978515625, 7.2962646484375, 7.812744140625, 8.3292236328125, 8.845703125, 9.3621826171875, 9.878662109375, 10.3951416015625, 10.91162109375, 11.4281005859375, 11.944580078125, 12.4610595703125, 12.9775390625, 13.4940185546875, 14.010498046875, 14.5269775390625, 15.04345703125, 15.5599365234375, 16.076416015625, 16.5928955078125, 17.109375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 7.0, 13.0, 18.0, 17.0, 37.0, 51.0, 65.0, 100.0, 164.0, 212.0, 342.0, 447.0, 616.0, 559.0, 434.0, 298.0, 206.0, 158.0, 111.0, 55.0, 56.0, 31.0, 26.0, 16.0, 10.0, 8.0, 4.0, 1.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.5234375, -15.1141357421875, -14.704833984375, -14.2955322265625, -13.88623046875, -13.4769287109375, -13.067626953125, -12.6583251953125, -12.2490234375, -11.8397216796875, -11.430419921875, -11.0211181640625, -10.61181640625, -10.2025146484375, -9.793212890625, -9.3839111328125, -8.974609375, -8.5653076171875, -8.156005859375, -7.7467041015625, -7.33740234375, -6.9281005859375, -6.518798828125, -6.1094970703125, -5.7001953125, -5.2908935546875, -4.881591796875, -4.4722900390625, -4.06298828125, -3.6536865234375, -3.244384765625, -2.8350830078125, -2.42578125, -2.0164794921875, -1.607177734375, -1.1978759765625, -0.78857421875, -0.3792724609375, 0.030029296875, 0.4393310546875, 0.8486328125, 1.2579345703125, 1.667236328125, 2.0765380859375, 2.48583984375, 2.8951416015625, 3.304443359375, 3.7137451171875, 4.123046875, 4.5323486328125, 4.941650390625, 5.3509521484375, 5.76025390625, 6.1695556640625, 6.578857421875, 6.9881591796875, 7.3974609375, 7.8067626953125, 8.216064453125, 8.6253662109375, 9.03466796875, 9.4439697265625, 9.853271484375, 10.2625732421875, 10.671875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 11.0, 7.0, 17.0, 24.0, 36.0, 56.0, 76.0, 102.0, 166.0, 241.0, 325.0, 473.0, 1738.0, 2380961.0, 1806839.0, 1692.0, 495.0, 279.0, 225.0, 151.0, 122.0, 84.0, 52.0, 36.0, 28.0, 22.0, 13.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -64.716796875, -62.55859375, -60.400390625, -58.2421875, -56.083984375, -53.92578125, -51.767578125, -49.609375, -47.451171875, -45.29296875, -43.134765625, -40.9765625, -38.818359375, -36.66015625, -34.501953125, -32.34375, -30.185546875, -28.02734375, -25.869140625, -23.7109375, -21.552734375, -19.39453125, -17.236328125, -15.078125, -12.919921875, -10.76171875, -8.603515625, -6.4453125, -4.287109375, -2.12890625, 0.029296875, 2.1875, 4.345703125, 6.50390625, 8.662109375, 10.8203125, 12.978515625, 15.13671875, 17.294921875, 19.453125, 21.611328125, 23.76953125, 25.927734375, 28.0859375, 30.244140625, 32.40234375, 34.560546875, 36.71875, 38.876953125, 41.03515625, 43.193359375, 45.3515625, 47.509765625, 49.66796875, 51.826171875, 53.984375, 56.142578125, 58.30078125, 60.458984375, 62.6171875, 64.775390625, 66.93359375, 69.091796875, 71.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 15.0, 150.0, 313.0, 374.0, 133.0, 27.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.8953399658203, -167.4841766357422, -163.072998046875, -158.66183471679688, -154.2506561279297, -149.83949279785156, -145.42831420898438, -141.01715087890625, -136.60598754882812, -132.19482421875, -127.78364562988281, -123.37247467041016, -118.9613037109375, -114.55014038085938, -110.13896942138672, -105.72779846191406, -101.31661987304688, -96.90544891357422, -92.49427795410156, -88.0831069946289, -83.67193603515625, -79.26077270507812, -74.84960174560547, -70.43843078613281, -66.02725982666016, -61.6160888671875, -57.204917907714844, -52.79375076293945, -48.3825798034668, -43.97140884399414, -39.56024169921875, -35.149070739746094, -30.737884521484375, -26.32671356201172, -21.915544509887695, -17.504375457763672, -13.093204498291016, -8.68203353881836, -4.270864486694336, 0.1403045654296875, 4.551475524902344, 8.962645530700684, 13.373815536499023, 17.784984588623047, 22.196155548095703, 26.60732650756836, 31.018495559692383, 35.429664611816406, 39.84083557128906, 44.25200653076172, 48.663177490234375, 53.074344635009766, 57.48551559448242, 61.89668655395508, 66.30785369873047, 70.71902465820312, 75.13019561767578, 79.54136657714844, 83.9525375366211, 88.36370849609375, 92.77487182617188, 97.18605041503906, 101.59721374511719, 106.00838470458984, 110.4195556640625]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 9.0, 3.0, 2.0, 8.0, 7.0, 14.0, 15.0, 14.0, 16.0, 20.0, 21.0, 24.0, 13.0, 21.0, 31.0, 33.0, 24.0, 34.0, 27.0, 25.0, 33.0, 39.0, 50.0, 46.0, 44.0, 37.0, 28.0, 42.0, 37.0, 30.0, 26.0, 27.0, 26.0, 17.0, 17.0, 19.0, 26.0, 17.0, 13.0, 15.0, 8.0, 15.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-32.211605072021484, -31.25213050842285, -30.29265785217285, -29.33318328857422, -28.373708724975586, -27.414234161376953, -26.454761505126953, -25.49528694152832, -24.535812377929688, -23.576337814331055, -22.616865158081055, -21.657390594482422, -20.69791603088379, -19.738441467285156, -18.778968811035156, -17.819494247436523, -16.86001968383789, -15.900546073913574, -14.941071510314941, -13.981597900390625, -13.022123336791992, -12.062649726867676, -11.10317611694336, -10.143701553344727, -9.184228897094727, -8.22475528717041, -7.265280723571777, -6.305807113647461, -5.346332550048828, -4.386858940124512, -3.427384853363037, -2.4679107666015625, -1.5084362030029297, -0.5489621758460999, 0.41051185131073, 1.369985818862915, 2.3294599056243896, 3.288933753967285, 4.24840784072876, 5.207881927490234, 6.167356014251709, 7.126830101013184, 8.0863037109375, 9.045778274536133, 10.00525188446045, 10.964725494384766, 11.924200057983398, 12.883674621582031, 13.843148231506348, 14.802621841430664, 15.762096405029297, 16.72157096862793, 17.68104362487793, 18.640518188476562, 19.599992752075195, 20.559467315673828, 21.518939971923828, 22.47841453552246, 23.43788719177246, 24.397361755371094, 25.356836318969727, 26.31631088256836, 27.27578353881836, 28.235258102416992, 29.194732666015625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 9.0, 5.0, 11.0, 11.0, 7.0, 9.0, 15.0, 20.0, 21.0, 27.0, 26.0, 19.0, 33.0, 35.0, 30.0, 26.0, 37.0, 40.0, 36.0, 45.0, 42.0, 36.0, 39.0, 42.0, 40.0, 38.0, 19.0, 35.0, 30.0, 28.0, 33.0, 22.0, 18.0, 17.0, 15.0, 19.0, 9.0, 10.0, 10.0, 12.0, 5.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.08984375, -4.93060302734375, -4.7713623046875, -4.61212158203125, -4.452880859375, -4.29364013671875, -4.1343994140625, -3.97515869140625, -3.81591796875, -3.65667724609375, -3.4974365234375, -3.33819580078125, -3.178955078125, -3.01971435546875, -2.8604736328125, -2.70123291015625, -2.5419921875, -2.38275146484375, -2.2235107421875, -2.06427001953125, -1.905029296875, -1.74578857421875, -1.5865478515625, -1.42730712890625, -1.26806640625, -1.10882568359375, -0.9495849609375, -0.79034423828125, -0.631103515625, -0.47186279296875, -0.3126220703125, -0.15338134765625, 0.005859375, 0.16510009765625, 0.3243408203125, 0.48358154296875, 0.642822265625, 0.80206298828125, 0.9613037109375, 1.12054443359375, 1.27978515625, 1.43902587890625, 1.5982666015625, 1.75750732421875, 1.916748046875, 2.07598876953125, 2.2352294921875, 2.39447021484375, 2.5537109375, 2.71295166015625, 2.8721923828125, 3.03143310546875, 3.190673828125, 3.34991455078125, 3.5091552734375, 3.66839599609375, 3.82763671875, 3.98687744140625, 4.1461181640625, 4.30535888671875, 4.464599609375, 4.62384033203125, 4.7830810546875, 4.94232177734375, 5.1015625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 7.0, 7.0, 6.0, 10.0, 30.0, 31.0, 66.0, 78.0, 125.0, 168.0, 226.0, 348.0, 507.0, 659.0, 953.0, 1333.0, 1930.0, 2742.0, 4001.0, 5730.0, 8002.0, 11863.0, 18048.0, 27550.0, 43047.0, 67855.0, 109272.0, 166491.0, 188395.0, 140193.0, 88111.0, 55328.0, 34726.0, 22698.0, 15370.0, 9985.0, 6825.0, 4697.0, 3250.0, 2343.0, 1644.0, 1180.0, 825.0, 583.0, 408.0, 294.0, 185.0, 159.0, 82.0, 62.0, 65.0, 24.0, 14.0, 14.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.6044921875, -0.5857620239257812, -0.5670318603515625, -0.5483016967773438, -0.529571533203125, -0.5108413696289062, -0.4921112060546875, -0.47338104248046875, -0.45465087890625, -0.43592071533203125, -0.4171905517578125, -0.39846038818359375, -0.379730224609375, -0.36100006103515625, -0.3422698974609375, -0.32353973388671875, -0.3048095703125, -0.28607940673828125, -0.2673492431640625, -0.24861907958984375, -0.229888916015625, -0.21115875244140625, -0.1924285888671875, -0.17369842529296875, -0.15496826171875, -0.13623809814453125, -0.1175079345703125, -0.09877777099609375, -0.080047607421875, -0.06131744384765625, -0.0425872802734375, -0.02385711669921875, -0.005126953125, 0.01360321044921875, 0.0323333740234375, 0.05106353759765625, 0.069793701171875, 0.08852386474609375, 0.1072540283203125, 0.12598419189453125, 0.14471435546875, 0.16344451904296875, 0.1821746826171875, 0.20090484619140625, 0.219635009765625, 0.23836517333984375, 0.2570953369140625, 0.27582550048828125, 0.2945556640625, 0.31328582763671875, 0.3320159912109375, 0.35074615478515625, 0.369476318359375, 0.38820648193359375, 0.4069366455078125, 0.42566680908203125, 0.44439697265625, 0.46312713623046875, 0.4818572998046875, 0.5005874633789062, 0.519317626953125, 0.5380477905273438, 0.5567779541015625, 0.5755081176757812, 0.59423828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 5.0, 9.0, 10.0, 9.0, 18.0, 19.0, 23.0, 22.0, 20.0, 26.0, 27.0, 31.0, 41.0, 36.0, 49.0, 41.0, 45.0, 48.0, 1077.0, 32.0, 44.0, 42.0, 30.0, 31.0, 38.0, 27.0, 27.0, 34.0, 21.0, 23.0, 21.0, 12.0, 17.0, 19.0, 7.0, 12.0, 8.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.267578125, -3.155242919921875, -3.04290771484375, -2.930572509765625, -2.8182373046875, -2.705902099609375, -2.59356689453125, -2.481231689453125, -2.368896484375, -2.256561279296875, -2.14422607421875, -2.031890869140625, -1.9195556640625, -1.807220458984375, -1.69488525390625, -1.582550048828125, -1.47021484375, -1.357879638671875, -1.24554443359375, -1.133209228515625, -1.0208740234375, -0.908538818359375, -0.79620361328125, -0.683868408203125, -0.571533203125, -0.459197998046875, -0.34686279296875, -0.234527587890625, -0.1221923828125, -0.009857177734375, 0.10247802734375, 0.214813232421875, 0.3271484375, 0.439483642578125, 0.55181884765625, 0.664154052734375, 0.7764892578125, 0.888824462890625, 1.00115966796875, 1.113494873046875, 1.225830078125, 1.338165283203125, 1.45050048828125, 1.562835693359375, 1.6751708984375, 1.787506103515625, 1.89984130859375, 2.012176513671875, 2.12451171875, 2.236846923828125, 2.34918212890625, 2.461517333984375, 2.5738525390625, 2.686187744140625, 2.79852294921875, 2.910858154296875, 3.023193359375, 3.135528564453125, 3.24786376953125, 3.360198974609375, 3.4725341796875, 3.584869384765625, 3.69720458984375, 3.809539794921875, 3.921875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 8.0, 16.0, 13.0, 23.0, 36.0, 62.0, 98.0, 119.0, 184.0, 320.0, 473.0, 819.0, 1387.0, 2196.0, 3568.0, 5995.0, 10509.0, 17943.0, 31681.0, 56319.0, 102264.0, 182842.0, 1287907.0, 172185.0, 95889.0, 52859.0, 30062.0, 16790.0, 9908.0, 5733.0, 3442.0, 2028.0, 1228.0, 782.0, 520.0, 316.0, 211.0, 127.0, 83.0, 56.0, 31.0, 44.0, 16.0, 12.0, 6.0, 9.0, 0.0, 1.0, 5.0, 0.0, 1.0], "bins": [-0.6884765625, -0.6690521240234375, -0.649627685546875, -0.6302032470703125, -0.61077880859375, -0.5913543701171875, -0.571929931640625, -0.5525054931640625, -0.5330810546875, -0.5136566162109375, -0.494232177734375, -0.4748077392578125, -0.45538330078125, -0.4359588623046875, -0.416534423828125, -0.3971099853515625, -0.377685546875, -0.3582611083984375, -0.338836669921875, -0.3194122314453125, -0.29998779296875, -0.2805633544921875, -0.261138916015625, -0.2417144775390625, -0.2222900390625, -0.2028656005859375, -0.183441162109375, -0.1640167236328125, -0.14459228515625, -0.1251678466796875, -0.105743408203125, -0.0863189697265625, -0.06689453125, -0.0474700927734375, -0.028045654296875, -0.0086212158203125, 0.01080322265625, 0.0302276611328125, 0.049652099609375, 0.0690765380859375, 0.0885009765625, 0.1079254150390625, 0.127349853515625, 0.1467742919921875, 0.16619873046875, 0.1856231689453125, 0.205047607421875, 0.2244720458984375, 0.243896484375, 0.2633209228515625, 0.282745361328125, 0.3021697998046875, 0.32159423828125, 0.3410186767578125, 0.360443115234375, 0.3798675537109375, 0.3992919921875, 0.4187164306640625, 0.438140869140625, 0.4575653076171875, 0.47698974609375, 0.4964141845703125, 0.515838623046875, 0.5352630615234375, 0.5546875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 7.0, 10.0, 9.0, 12.0, 11.0, 12.0, 17.0, 33.0, 33.0, 32.0, 52.0, 32.0, 38.0, 59.0, 60.0, 60.0, 65.0, 71.0, 57.0, 55.0, 36.0, 45.0, 35.0, 29.0, 29.0, 22.0, 12.0, 12.0, 13.0, 10.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00212860107421875, -0.0020547211170196533, -0.0019808411598205566, -0.00190696120262146, -0.0018330812454223633, -0.0017592012882232666, -0.00168532133102417, -0.0016114413738250732, -0.0015375614166259766, -0.0014636814594268799, -0.0013898015022277832, -0.0013159215450286865, -0.0012420415878295898, -0.0011681616306304932, -0.0010942816734313965, -0.0010204017162322998, -0.0009465217590332031, -0.0008726418018341064, -0.0007987618446350098, -0.0007248818874359131, -0.0006510019302368164, -0.0005771219730377197, -0.000503242015838623, -0.00042936205863952637, -0.0003554821014404297, -0.000281602144241333, -0.00020772218704223633, -0.00013384222984313965, -5.996227264404297e-05, 1.3917684555053711e-05, 8.779764175415039e-05, 0.00016167759895324707, 0.00023555755615234375, 0.00030943751335144043, 0.0003833174705505371, 0.0004571974277496338, 0.0005310773849487305, 0.0006049573421478271, 0.0006788372993469238, 0.0007527172565460205, 0.0008265972137451172, 0.0009004771709442139, 0.0009743571281433105, 0.0010482370853424072, 0.001122117042541504, 0.0011959969997406006, 0.0012698769569396973, 0.001343756914138794, 0.0014176368713378906, 0.0014915168285369873, 0.001565396785736084, 0.0016392767429351807, 0.0017131567001342773, 0.001787036657333374, 0.0018609166145324707, 0.0019347965717315674, 0.002008676528930664, 0.0020825564861297607, 0.0021564364433288574, 0.002230316400527954, 0.0023041963577270508, 0.0023780763149261475, 0.002451956272125244, 0.002525836229324341, 0.0025997161865234375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 8.0, 8.0, 13.0, 15.0, 23.0, 21.0, 22.0, 29.0, 46.0, 62.0, 84.0, 102.0, 127.0, 261.0, 478.0, 2157.0, 951446.0, 91648.0, 1013.0, 332.0, 170.0, 108.0, 79.0, 64.0, 65.0, 40.0, 25.0, 23.0, 16.0, 13.0, 17.0, 8.0, 5.0, 1.0, 4.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.05810546875, -0.056527137756347656, -0.05494880676269531, -0.05337047576904297, -0.051792144775390625, -0.05021381378173828, -0.04863548278808594, -0.047057151794433594, -0.04547882080078125, -0.043900489807128906, -0.04232215881347656, -0.04074382781982422, -0.039165496826171875, -0.03758716583251953, -0.03600883483886719, -0.034430503845214844, -0.0328521728515625, -0.031273841857910156, -0.029695510864257812, -0.02811717987060547, -0.026538848876953125, -0.02496051788330078, -0.023382186889648438, -0.021803855895996094, -0.02022552490234375, -0.018647193908691406, -0.017068862915039062, -0.015490531921386719, -0.013912200927734375, -0.012333869934082031, -0.010755538940429688, -0.009177207946777344, -0.007598876953125, -0.006020545959472656, -0.0044422149658203125, -0.0028638839721679688, -0.001285552978515625, 0.00029277801513671875, 0.0018711090087890625, 0.0034494400024414062, 0.00502777099609375, 0.006606101989746094, 0.008184432983398438, 0.009762763977050781, 0.011341094970703125, 0.012919425964355469, 0.014497756958007812, 0.016076087951660156, 0.0176544189453125, 0.019232749938964844, 0.020811080932617188, 0.02238941192626953, 0.023967742919921875, 0.02554607391357422, 0.027124404907226562, 0.028702735900878906, 0.03028106689453125, 0.031859397888183594, 0.03343772888183594, 0.03501605987548828, 0.036594390869140625, 0.03817272186279297, 0.03975105285644531, 0.041329383850097656, 0.04290771484375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 65.0, 936.0, 18.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0337277427315712, -0.033129896968603134, -0.03253204748034477, -0.03193420171737671, -0.031336355954408646, -0.030738508328795433, -0.03014066256582737, -0.029542814940214157, -0.028944969177246094, -0.02834712155163288, -0.027749275788664818, -0.027151428163051605, -0.026553582400083542, -0.02595573477447033, -0.025357889011502266, -0.024760041385889053, -0.02416219376027584, -0.023564346134662628, -0.022966500371694565, -0.022368652746081352, -0.02177080698311329, -0.021172959357500076, -0.020575113594532013, -0.0199772659689188, -0.019379418343305588, -0.018781570717692375, -0.018183724954724312, -0.0175858773291111, -0.016988031566143036, -0.016390183940529823, -0.01579233817756176, -0.015194490551948547, -0.014596642926335335, -0.013998796232044697, -0.013400949537754059, -0.012803102843463421, -0.012205256149172783, -0.01160740852355957, -0.011009561829268932, -0.010411715134978294, -0.009813869372010231, -0.009216022677719593, -0.008618175983428955, -0.008020329289138317, -0.007422482129186392, -0.006824635434895754, -0.006226788274943829, -0.005628941580653191, -0.005031094420701265, -0.004433247726410627, -0.0038354007992893457, -0.003237553872168064, -0.002639707177877426, -0.002041860483586788, -0.0014440135564655066, -0.0008461666293442249, -0.00024831993505358696, 0.00034952687565237284, 0.0009473736863583326, 0.0015452204970642924, 0.0021430673077702522, 0.00274091400206089, 0.003338760929182172, 0.0039366078563034534, 0.004534454550594091]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 6.0, 12.0, 7.0, 14.0, 24.0, 11.0, 23.0, 37.0, 36.0, 38.0, 33.0, 46.0, 52.0, 54.0, 46.0, 43.0, 47.0, 51.0, 46.0, 46.0, 56.0, 42.0, 32.0, 23.0, 32.0, 30.0, 18.0, 20.0, 19.0, 14.0, 10.0, 10.0, 6.0, 5.0, 8.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012114644050598145, -0.001164414919912815, -0.0011173654347658157, -0.0010703159496188164, -0.001023266464471817, -0.0009762169793248177, -0.0009291674941778183, -0.0008821180090308189, -0.0008350685238838196, -0.0007880190387368202, -0.0007409695535898209, -0.0006939200684428215, -0.0006468705832958221, -0.0005998210981488228, -0.0005527716130018234, -0.0005057221278548241, -0.0004586726427078247, -0.00041162315756082535, -0.000364573672413826, -0.00031752418726682663, -0.00027047470211982727, -0.0002234252169728279, -0.00017637573182582855, -0.0001293262466788292, -8.227676153182983e-05, -3.5227276384830475e-05, 1.1822208762168884e-05, 5.8871693909168243e-05, 0.0001059211790561676, 0.00015297066420316696, 0.00020002014935016632, 0.0002470696344971657, 0.00029411911964416504, 0.0003411686047911644, 0.00038821808993816376, 0.0004352675750851631, 0.0004823170602321625, 0.0005293665453791618, 0.0005764160305261612, 0.0006234655156731606, 0.0006705150008201599, 0.0007175644859671593, 0.0007646139711141586, 0.000811663456261158, 0.0008587129414081573, 0.0009057624265551567, 0.0009528119117021561, 0.0009998613968491554, 0.0010469108819961548, 0.0010939603671431541, 0.0011410098522901535, 0.0011880593374371529, 0.0012351088225841522, 0.0012821583077311516, 0.001329207792878151, 0.0013762572780251503, 0.0014233067631721497, 0.001470356248319149, 0.0015174057334661484, 0.0015644552186131477, 0.001611504703760147, 0.0016585541889071465, 0.0017056036740541458, 0.0017526531592011452, 0.0017997026443481445]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 9.0, 5.0, 11.0, 11.0, 7.0, 9.0, 15.0, 20.0, 21.0, 27.0, 26.0, 19.0, 33.0, 35.0, 30.0, 26.0, 37.0, 41.0, 35.0, 45.0, 42.0, 36.0, 39.0, 42.0, 41.0, 37.0, 19.0, 35.0, 30.0, 28.0, 33.0, 22.0, 18.0, 17.0, 15.0, 19.0, 9.0, 10.0, 10.0, 12.0, 5.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.08984375, -4.93060302734375, -4.7713623046875, -4.61212158203125, -4.452880859375, -4.29364013671875, -4.1343994140625, -3.97515869140625, -3.81591796875, -3.65667724609375, -3.4974365234375, -3.33819580078125, -3.178955078125, -3.01971435546875, -2.8604736328125, -2.70123291015625, -2.5419921875, -2.38275146484375, -2.2235107421875, -2.06427001953125, -1.905029296875, -1.74578857421875, -1.5865478515625, -1.42730712890625, -1.26806640625, -1.10882568359375, -0.9495849609375, -0.79034423828125, -0.631103515625, -0.47186279296875, -0.3126220703125, -0.15338134765625, 0.005859375, 0.16510009765625, 0.3243408203125, 0.48358154296875, 0.642822265625, 0.80206298828125, 0.9613037109375, 1.12054443359375, 1.27978515625, 1.43902587890625, 1.5982666015625, 1.75750732421875, 1.916748046875, 2.07598876953125, 2.2352294921875, 2.39447021484375, 2.5537109375, 2.71295166015625, 2.8721923828125, 3.03143310546875, 3.190673828125, 3.34991455078125, 3.5091552734375, 3.66839599609375, 3.82763671875, 3.98687744140625, 4.1461181640625, 4.30535888671875, 4.464599609375, 4.62384033203125, 4.7830810546875, 4.94232177734375, 5.1015625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 9.0, 8.0, 15.0, 19.0, 39.0, 33.0, 39.0, 43.0, 69.0, 90.0, 149.0, 205.0, 293.0, 543.0, 1281.0, 2963.0, 7343.0, 20230.0, 56617.0, 170653.0, 474360.0, 206738.0, 67361.0, 24017.0, 8846.0, 3436.0, 1432.0, 676.0, 327.0, 186.0, 130.0, 80.0, 67.0, 53.0, 39.0, 42.0, 33.0, 17.0, 14.0, 13.0, 9.0, 4.0, 7.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.144287109375, -4.97607421875, -4.807861328125, -4.6396484375, -4.471435546875, -4.30322265625, -4.135009765625, -3.966796875, -3.798583984375, -3.63037109375, -3.462158203125, -3.2939453125, -3.125732421875, -2.95751953125, -2.789306640625, -2.62109375, -2.452880859375, -2.28466796875, -2.116455078125, -1.9482421875, -1.780029296875, -1.61181640625, -1.443603515625, -1.275390625, -1.107177734375, -0.93896484375, -0.770751953125, -0.6025390625, -0.434326171875, -0.26611328125, -0.097900390625, 0.0703125, 0.238525390625, 0.40673828125, 0.574951171875, 0.7431640625, 0.911376953125, 1.07958984375, 1.247802734375, 1.416015625, 1.584228515625, 1.75244140625, 1.920654296875, 2.0888671875, 2.257080078125, 2.42529296875, 2.593505859375, 2.76171875, 2.929931640625, 3.09814453125, 3.266357421875, 3.4345703125, 3.602783203125, 3.77099609375, 3.939208984375, 4.107421875, 4.275634765625, 4.44384765625, 4.612060546875, 4.7802734375, 4.948486328125, 5.11669921875, 5.284912109375, 5.453125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 9.0, 12.0, 13.0, 17.0, 19.0, 24.0, 23.0, 31.0, 28.0, 40.0, 33.0, 44.0, 54.0, 54.0, 69.0, 282.0, 1711.0, 136.0, 59.0, 53.0, 41.0, 41.0, 40.0, 33.0, 32.0, 22.0, 24.0, 16.0, 23.0, 13.0, 12.0, 10.0, 4.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.765625, -18.201416015625, -17.63720703125, -17.072998046875, -16.5087890625, -15.944580078125, -15.38037109375, -14.816162109375, -14.251953125, -13.687744140625, -13.12353515625, -12.559326171875, -11.9951171875, -11.430908203125, -10.86669921875, -10.302490234375, -9.73828125, -9.174072265625, -8.60986328125, -8.045654296875, -7.4814453125, -6.917236328125, -6.35302734375, -5.788818359375, -5.224609375, -4.660400390625, -4.09619140625, -3.531982421875, -2.9677734375, -2.403564453125, -1.83935546875, -1.275146484375, -0.7109375, -0.146728515625, 0.41748046875, 0.981689453125, 1.5458984375, 2.110107421875, 2.67431640625, 3.238525390625, 3.802734375, 4.366943359375, 4.93115234375, 5.495361328125, 6.0595703125, 6.623779296875, 7.18798828125, 7.752197265625, 8.31640625, 8.880615234375, 9.44482421875, 10.009033203125, 10.5732421875, 11.137451171875, 11.70166015625, 12.265869140625, 12.830078125, 13.394287109375, 13.95849609375, 14.522705078125, 15.0869140625, 15.651123046875, 16.21533203125, 16.779541015625, 17.34375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 11.0, 13.0, 20.0, 25.0, 35.0, 52.0, 51.0, 74.0, 96.0, 163.0, 233.0, 397.0, 901.0, 6749.0, 3099277.0, 34907.0, 1262.0, 529.0, 279.0, 166.0, 117.0, 87.0, 60.0, 50.0, 36.0, 30.0, 16.0, 21.0, 11.0, 10.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.0625, -40.541015625, -39.01953125, -37.498046875, -35.9765625, -34.455078125, -32.93359375, -31.412109375, -29.890625, -28.369140625, -26.84765625, -25.326171875, -23.8046875, -22.283203125, -20.76171875, -19.240234375, -17.71875, -16.197265625, -14.67578125, -13.154296875, -11.6328125, -10.111328125, -8.58984375, -7.068359375, -5.546875, -4.025390625, -2.50390625, -0.982421875, 0.5390625, 2.060546875, 3.58203125, 5.103515625, 6.625, 8.146484375, 9.66796875, 11.189453125, 12.7109375, 14.232421875, 15.75390625, 17.275390625, 18.796875, 20.318359375, 21.83984375, 23.361328125, 24.8828125, 26.404296875, 27.92578125, 29.447265625, 30.96875, 32.490234375, 34.01171875, 35.533203125, 37.0546875, 38.576171875, 40.09765625, 41.619140625, 43.140625, 44.662109375, 46.18359375, 47.705078125, 49.2265625, 50.748046875, 52.26953125, 53.791015625, 55.3125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 100.0, 843.0, 68.0, 3.0, 1.0, 0.0, 1.0], "bins": [-263.8231506347656, -259.3093566894531, -254.79559326171875, -250.2818145751953, -245.76803588867188, -241.25425720214844, -236.740478515625, -232.2266845703125, -227.71292114257812, -223.1991424560547, -218.68536376953125, -214.1715850830078, -209.65780639648438, -205.14402770996094, -200.6302490234375, -196.116455078125, -191.60267639160156, -187.08889770507812, -182.5751190185547, -178.06134033203125, -173.5475616455078, -169.03378295898438, -164.52000427246094, -160.0062255859375, -155.492431640625, -150.97865295410156, -146.46487426757812, -141.9510955810547, -137.43731689453125, -132.9235382080078, -128.40975952148438, -123.8959732055664, -119.38220977783203, -114.8684310913086, -110.35465240478516, -105.84087371826172, -101.32708740234375, -96.81330871582031, -92.29953002929688, -87.78575134277344, -83.27197265625, -78.75819396972656, -74.24441528320312, -69.73063659667969, -65.21685791015625, -60.70307540893555, -56.189292907714844, -51.675514221191406, -47.16173553466797, -42.64795684814453, -38.134178161621094, -33.62039566040039, -29.106616973876953, -24.592838287353516, -20.079057693481445, -15.565277099609375, -11.051496505737305, -6.537716865539551, -2.023937225341797, 2.489842414855957, 7.003622055053711, 11.517400741577148, 16.03118133544922, 20.54496192932129, 25.058740615844727]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 4.0, 4.0, 7.0, 12.0, 5.0, 19.0, 17.0, 11.0, 17.0, 17.0, 13.0, 42.0, 36.0, 46.0, 35.0, 37.0, 38.0, 29.0, 38.0, 43.0, 34.0, 52.0, 48.0, 37.0, 39.0, 33.0, 39.0, 29.0, 26.0, 21.0, 26.0, 24.0, 15.0, 29.0, 12.0, 9.0, 10.0, 15.0, 7.0, 5.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-47.05217742919922, -45.647544860839844, -44.242916107177734, -42.838287353515625, -41.43365478515625, -40.029022216796875, -38.624393463134766, -37.219764709472656, -35.81513214111328, -34.410499572753906, -33.0058708190918, -31.601240158081055, -30.196609497070312, -28.79197883605957, -27.387348175048828, -25.982717514038086, -24.578086853027344, -23.1734561920166, -21.76882553100586, -20.364194869995117, -18.959564208984375, -17.554933547973633, -16.15030288696289, -14.745672225952148, -13.341041564941406, -11.936410903930664, -10.531780242919922, -9.12714958190918, -7.7225189208984375, -6.317888259887695, -4.913257598876953, -3.508626937866211, -2.1039962768554688, -0.6993656158447266, 0.7052650451660156, 2.109895706176758, 3.5145263671875, 4.919157028198242, 6.323787689208984, 7.728418350219727, 9.133049011230469, 10.537679672241211, 11.942310333251953, 13.346940994262695, 14.751571655273438, 16.15620231628418, 17.560832977294922, 18.965463638305664, 20.370094299316406, 21.77472496032715, 23.17935562133789, 24.583986282348633, 25.988616943359375, 27.393247604370117, 28.79787826538086, 30.2025089263916, 31.607139587402344, 33.01177215576172, 34.41640090942383, 35.82102966308594, 37.22566223144531, 38.63029479980469, 40.0349235534668, 41.439552307128906, 42.84418487548828]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 5.0, 3.0, 7.0, 8.0, 11.0, 11.0, 18.0, 21.0, 19.0, 20.0, 29.0, 29.0, 33.0, 33.0, 25.0, 40.0, 35.0, 35.0, 36.0, 45.0, 41.0, 37.0, 33.0, 36.0, 33.0, 34.0, 40.0, 25.0, 25.0, 34.0, 27.0, 30.0, 15.0, 19.0, 14.0, 23.0, 12.0, 10.0, 11.0, 6.0, 6.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.2265625, -5.06298828125, -4.8994140625, -4.73583984375, -4.572265625, -4.40869140625, -4.2451171875, -4.08154296875, -3.91796875, -3.75439453125, -3.5908203125, -3.42724609375, -3.263671875, -3.10009765625, -2.9365234375, -2.77294921875, -2.609375, -2.44580078125, -2.2822265625, -2.11865234375, -1.955078125, -1.79150390625, -1.6279296875, -1.46435546875, -1.30078125, -1.13720703125, -0.9736328125, -0.81005859375, -0.646484375, -0.48291015625, -0.3193359375, -0.15576171875, 0.0078125, 0.17138671875, 0.3349609375, 0.49853515625, 0.662109375, 0.82568359375, 0.9892578125, 1.15283203125, 1.31640625, 1.47998046875, 1.6435546875, 1.80712890625, 1.970703125, 2.13427734375, 2.2978515625, 2.46142578125, 2.625, 2.78857421875, 2.9521484375, 3.11572265625, 3.279296875, 3.44287109375, 3.6064453125, 3.77001953125, 3.93359375, 4.09716796875, 4.2607421875, 4.42431640625, 4.587890625, 4.75146484375, 4.9150390625, 5.07861328125, 5.2421875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 6.0, 10.0, 9.0, 15.0, 14.0, 21.0, 21.0, 39.0, 48.0, 45.0, 64.0, 103.0, 157.0, 298.0, 559.0, 1736.0, 11092.0, 286637.0, 3385640.0, 487788.0, 16158.0, 2198.0, 659.0, 316.0, 175.0, 131.0, 85.0, 61.0, 41.0, 25.0, 19.0, 24.0, 14.0, 14.0, 10.0, 12.0, 10.0, 12.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.21875, -18.646240234375, -18.07373046875, -17.501220703125, -16.9287109375, -16.356201171875, -15.78369140625, -15.211181640625, -14.638671875, -14.066162109375, -13.49365234375, -12.921142578125, -12.3486328125, -11.776123046875, -11.20361328125, -10.631103515625, -10.05859375, -9.486083984375, -8.91357421875, -8.341064453125, -7.7685546875, -7.196044921875, -6.62353515625, -6.051025390625, -5.478515625, -4.906005859375, -4.33349609375, -3.760986328125, -3.1884765625, -2.615966796875, -2.04345703125, -1.470947265625, -0.8984375, -0.325927734375, 0.24658203125, 0.819091796875, 1.3916015625, 1.964111328125, 2.53662109375, 3.109130859375, 3.681640625, 4.254150390625, 4.82666015625, 5.399169921875, 5.9716796875, 6.544189453125, 7.11669921875, 7.689208984375, 8.26171875, 8.834228515625, 9.40673828125, 9.979248046875, 10.5517578125, 11.124267578125, 11.69677734375, 12.269287109375, 12.841796875, 13.414306640625, 13.98681640625, 14.559326171875, 15.1318359375, 15.704345703125, 16.27685546875, 16.849365234375, 17.421875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 8.0, 17.0, 22.0, 34.0, 43.0, 58.0, 78.0, 129.0, 143.0, 174.0, 253.0, 402.0, 478.0, 550.0, 484.0, 334.0, 277.0, 176.0, 124.0, 72.0, 64.0, 34.0, 36.0, 18.0, 21.0, 10.0, 3.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-15.1484375, -14.79852294921875, -14.4486083984375, -14.09869384765625, -13.748779296875, -13.39886474609375, -13.0489501953125, -12.69903564453125, -12.34912109375, -11.99920654296875, -11.6492919921875, -11.29937744140625, -10.949462890625, -10.59954833984375, -10.2496337890625, -9.89971923828125, -9.5498046875, -9.19989013671875, -8.8499755859375, -8.50006103515625, -8.150146484375, -7.80023193359375, -7.4503173828125, -7.10040283203125, -6.75048828125, -6.40057373046875, -6.0506591796875, -5.70074462890625, -5.350830078125, -5.00091552734375, -4.6510009765625, -4.30108642578125, -3.951171875, -3.60125732421875, -3.2513427734375, -2.90142822265625, -2.551513671875, -2.20159912109375, -1.8516845703125, -1.50177001953125, -1.15185546875, -0.80194091796875, -0.4520263671875, -0.10211181640625, 0.247802734375, 0.59771728515625, 0.9476318359375, 1.29754638671875, 1.6474609375, 1.99737548828125, 2.3472900390625, 2.69720458984375, 3.047119140625, 3.39703369140625, 3.7469482421875, 4.09686279296875, 4.44677734375, 4.79669189453125, 5.1466064453125, 5.49652099609375, 5.846435546875, 6.19635009765625, 6.5462646484375, 6.89617919921875, 7.24609375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 8.0, 16.0, 19.0, 28.0, 25.0, 47.0, 70.0, 88.0, 129.0, 168.0, 252.0, 329.0, 576.0, 2973.0, 2841722.0, 1343952.0, 2163.0, 478.0, 293.0, 226.0, 183.0, 134.0, 100.0, 74.0, 77.0, 58.0, 33.0, 21.0, 12.0, 8.0, 8.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.6875, -38.74609375, -36.8046875, -34.86328125, -32.921875, -30.98046875, -29.0390625, -27.09765625, -25.15625, -23.21484375, -21.2734375, -19.33203125, -17.390625, -15.44921875, -13.5078125, -11.56640625, -9.625, -7.68359375, -5.7421875, -3.80078125, -1.859375, 0.08203125, 2.0234375, 3.96484375, 5.90625, 7.84765625, 9.7890625, 11.73046875, 13.671875, 15.61328125, 17.5546875, 19.49609375, 21.4375, 23.37890625, 25.3203125, 27.26171875, 29.203125, 31.14453125, 33.0859375, 35.02734375, 36.96875, 38.91015625, 40.8515625, 42.79296875, 44.734375, 46.67578125, 48.6171875, 50.55859375, 52.5, 54.44140625, 56.3828125, 58.32421875, 60.265625, 62.20703125, 64.1484375, 66.08984375, 68.03125, 69.97265625, 71.9140625, 73.85546875, 75.796875, 77.73828125, 79.6796875, 81.62109375, 83.5625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 40.0, 206.0, 373.0, 276.0, 86.0, 22.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-197.3533935546875, -193.31011962890625, -189.266845703125, -185.2235870361328, -181.18031311035156, -177.1370391845703, -173.09378051757812, -169.05050659179688, -165.00723266601562, -160.96395874023438, -156.92068481445312, -152.87742614746094, -148.8341522216797, -144.79087829589844, -140.74761962890625, -136.704345703125, -132.66107177734375, -128.6177978515625, -124.57453155517578, -120.53126525878906, -116.48799133300781, -112.44471740722656, -108.40145111083984, -104.35818481445312, -100.31491088867188, -96.27163696289062, -92.2283706665039, -88.18510437011719, -84.14183044433594, -80.09855651855469, -76.05529022216797, -72.01202392578125, -67.96876525878906, -63.92549514770508, -59.882225036621094, -55.83895492553711, -51.795684814453125, -47.75241470336914, -43.709144592285156, -39.66587448120117, -35.62260437011719, -31.579334259033203, -27.53606414794922, -23.492794036865234, -19.44952392578125, -15.406253814697266, -11.362983703613281, -7.319713592529297, -3.2764434814453125, 0.7668266296386719, 4.810096740722656, 8.85336685180664, 12.896636962890625, 16.93990707397461, 20.983177185058594, 25.026447296142578, 29.069717407226562, 33.11298751831055, 37.15625762939453, 41.199527740478516, 45.2427978515625, 49.286067962646484, 53.32933807373047, 57.37260818481445, 61.41587829589844]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 1.0, 3.0, 3.0, 5.0, 8.0, 8.0, 11.0, 8.0, 12.0, 13.0, 17.0, 29.0, 25.0, 25.0, 38.0, 31.0, 24.0, 29.0, 50.0, 41.0, 35.0, 44.0, 42.0, 42.0, 31.0, 45.0, 43.0, 38.0, 33.0, 35.0, 37.0, 25.0, 31.0, 20.0, 24.0, 18.0, 15.0, 12.0, 11.0, 10.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.54911804199219, -32.466426849365234, -31.38373565673828, -30.301042556762695, -29.218351364135742, -28.13566017150879, -27.052967071533203, -25.97027587890625, -24.887584686279297, -23.804893493652344, -22.72220230102539, -21.639509201049805, -20.55681800842285, -19.4741268157959, -18.391433715820312, -17.30874252319336, -16.226051330566406, -15.143360137939453, -14.060667991638184, -12.977975845336914, -11.895284652709961, -10.812593460083008, -9.729901313781738, -8.647209167480469, -7.564517974853516, -6.481826305389404, -5.399134635925293, -4.316442966461182, -3.2337512969970703, -2.151059627532959, -1.0683679580688477, 0.014323711395263672, 1.097015380859375, 2.1797070503234863, 3.2623987197875977, 4.345090389251709, 5.42778205871582, 6.510473728179932, 7.593165397644043, 8.675857543945312, 9.758548736572266, 10.841239929199219, 11.923932075500488, 13.006624221801758, 14.089315414428711, 15.172006607055664, 16.25469970703125, 17.337390899658203, 18.420082092285156, 19.50277328491211, 20.585464477539062, 21.66815757751465, 22.7508487701416, 23.833539962768555, 24.91623306274414, 25.998924255371094, 27.081615447998047, 28.164306640625, 29.246997833251953, 30.32969093322754, 31.412382125854492, 32.49507522583008, 33.57776641845703, 34.660457611083984, 35.74314880371094]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 6.0, 13.0, 13.0, 14.0, 13.0, 23.0, 21.0, 23.0, 20.0, 28.0, 42.0, 33.0, 27.0, 40.0, 25.0, 33.0, 48.0, 40.0, 46.0, 30.0, 38.0, 40.0, 36.0, 31.0, 36.0, 23.0, 28.0, 28.0, 26.0, 14.0, 18.0, 25.0, 13.0, 16.0, 18.0, 15.0, 12.0, 10.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.2578125, -5.0916748046875, -4.925537109375, -4.7593994140625, -4.59326171875, -4.4271240234375, -4.260986328125, -4.0948486328125, -3.9287109375, -3.7625732421875, -3.596435546875, -3.4302978515625, -3.26416015625, -3.0980224609375, -2.931884765625, -2.7657470703125, -2.599609375, -2.4334716796875, -2.267333984375, -2.1011962890625, -1.93505859375, -1.7689208984375, -1.602783203125, -1.4366455078125, -1.2705078125, -1.1043701171875, -0.938232421875, -0.7720947265625, -0.60595703125, -0.4398193359375, -0.273681640625, -0.1075439453125, 0.05859375, 0.2247314453125, 0.390869140625, 0.5570068359375, 0.72314453125, 0.8892822265625, 1.055419921875, 1.2215576171875, 1.3876953125, 1.5538330078125, 1.719970703125, 1.8861083984375, 2.05224609375, 2.2183837890625, 2.384521484375, 2.5506591796875, 2.716796875, 2.8829345703125, 3.049072265625, 3.2152099609375, 3.38134765625, 3.5474853515625, 3.713623046875, 3.8797607421875, 4.0458984375, 4.2120361328125, 4.378173828125, 4.5443115234375, 4.71044921875, 4.8765869140625, 5.042724609375, 5.2088623046875, 5.375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 9.0, 8.0, 19.0, 33.0, 38.0, 52.0, 69.0, 112.0, 148.0, 235.0, 310.0, 489.0, 757.0, 1045.0, 1591.0, 2262.0, 3584.0, 5496.0, 8264.0, 12830.0, 20145.0, 32901.0, 55481.0, 96681.0, 168643.0, 227572.0, 168357.0, 96104.0, 54918.0, 32943.0, 20173.0, 12959.0, 8320.0, 5273.0, 3536.0, 2320.0, 1572.0, 1066.0, 738.0, 457.0, 345.0, 216.0, 151.0, 102.0, 63.0, 61.0, 34.0, 25.0, 18.0, 13.0, 8.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.7509765625, -0.7278671264648438, -0.7047576904296875, -0.6816482543945312, -0.658538818359375, -0.6354293823242188, -0.6123199462890625, -0.5892105102539062, -0.56610107421875, -0.5429916381835938, -0.5198822021484375, -0.49677276611328125, -0.473663330078125, -0.45055389404296875, -0.4274444580078125, -0.40433502197265625, -0.3812255859375, -0.35811614990234375, -0.3350067138671875, -0.31189727783203125, -0.288787841796875, -0.26567840576171875, -0.2425689697265625, -0.21945953369140625, -0.19635009765625, -0.17324066162109375, -0.1501312255859375, -0.12702178955078125, -0.103912353515625, -0.08080291748046875, -0.0576934814453125, -0.03458404541015625, -0.011474609375, 0.01163482666015625, 0.0347442626953125, 0.05785369873046875, 0.080963134765625, 0.10407257080078125, 0.1271820068359375, 0.15029144287109375, 0.17340087890625, 0.19651031494140625, 0.2196197509765625, 0.24272918701171875, 0.265838623046875, 0.28894805908203125, 0.3120574951171875, 0.33516693115234375, 0.3582763671875, 0.38138580322265625, 0.4044952392578125, 0.42760467529296875, 0.450714111328125, 0.47382354736328125, 0.4969329833984375, 0.5200424194335938, 0.54315185546875, 0.5662612915039062, 0.5893707275390625, 0.6124801635742188, 0.635589599609375, 0.6586990356445312, 0.6818084716796875, 0.7049179077148438, 0.72802734375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 7.0, 20.0, 16.0, 13.0, 23.0, 21.0, 20.0, 18.0, 29.0, 30.0, 28.0, 42.0, 43.0, 43.0, 40.0, 41.0, 1073.0, 54.0, 48.0, 37.0, 43.0, 38.0, 26.0, 34.0, 38.0, 28.0, 27.0, 23.0, 23.0, 16.0, 21.0, 13.0, 7.0, 9.0, 4.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03125, -2.9140625, -2.796875, -2.6796875, -2.5625, -2.4453125, -2.328125, -2.2109375, -2.09375, -1.9765625, -1.859375, -1.7421875, -1.625, -1.5078125, -1.390625, -1.2734375, -1.15625, -1.0390625, -0.921875, -0.8046875, -0.6875, -0.5703125, -0.453125, -0.3359375, -0.21875, -0.1015625, 0.015625, 0.1328125, 0.25, 0.3671875, 0.484375, 0.6015625, 0.71875, 0.8359375, 0.953125, 1.0703125, 1.1875, 1.3046875, 1.421875, 1.5390625, 1.65625, 1.7734375, 1.890625, 2.0078125, 2.125, 2.2421875, 2.359375, 2.4765625, 2.59375, 2.7109375, 2.828125, 2.9453125, 3.0625, 3.1796875, 3.296875, 3.4140625, 3.53125, 3.6484375, 3.765625, 3.8828125, 4.0, 4.1171875, 4.234375, 4.3515625, 4.46875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 2.0, 8.0, 22.0, 18.0, 33.0, 51.0, 77.0, 115.0, 185.0, 322.0, 479.0, 800.0, 1231.0, 2086.0, 3654.0, 6430.0, 11224.0, 20418.0, 38084.0, 72566.0, 139336.0, 1172916.0, 338844.0, 135115.0, 69967.0, 37096.0, 19972.0, 11091.0, 6100.0, 3491.0, 2074.0, 1291.0, 762.0, 479.0, 303.0, 166.0, 102.0, 92.0, 47.0, 20.0, 20.0, 12.0, 14.0, 4.0, 5.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68115234375, -0.6591644287109375, -0.637176513671875, -0.6151885986328125, -0.59320068359375, -0.5712127685546875, -0.549224853515625, -0.5272369384765625, -0.5052490234375, -0.4832611083984375, -0.461273193359375, -0.4392852783203125, -0.41729736328125, -0.3953094482421875, -0.373321533203125, -0.3513336181640625, -0.329345703125, -0.3073577880859375, -0.285369873046875, -0.2633819580078125, -0.24139404296875, -0.2194061279296875, -0.197418212890625, -0.1754302978515625, -0.1534423828125, -0.1314544677734375, -0.109466552734375, -0.0874786376953125, -0.06549072265625, -0.0435028076171875, -0.021514892578125, 0.0004730224609375, 0.0224609375, 0.0444488525390625, 0.066436767578125, 0.0884246826171875, 0.11041259765625, 0.1324005126953125, 0.154388427734375, 0.1763763427734375, 0.1983642578125, 0.2203521728515625, 0.242340087890625, 0.2643280029296875, 0.28631591796875, 0.3083038330078125, 0.330291748046875, 0.3522796630859375, 0.374267578125, 0.3962554931640625, 0.418243408203125, 0.4402313232421875, 0.46221923828125, 0.4842071533203125, 0.506195068359375, 0.5281829833984375, 0.5501708984375, 0.5721588134765625, 0.594146728515625, 0.6161346435546875, 0.63812255859375, 0.6601104736328125, 0.682098388671875, 0.7040863037109375, 0.72607421875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 2.0, 4.0, 6.0, 9.0, 13.0, 16.0, 20.0, 31.0, 45.0, 44.0, 54.0, 53.0, 57.0, 62.0, 67.0, 79.0, 54.0, 61.0, 52.0, 49.0, 39.0, 40.0, 24.0, 35.0, 19.0, 15.0, 15.0, 11.0, 6.0, 6.0, 4.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.002292633056640625, -0.0022272467613220215, -0.002161860466003418, -0.0020964741706848145, -0.002031087875366211, -0.0019657015800476074, -0.001900315284729004, -0.0018349289894104004, -0.0017695426940917969, -0.0017041563987731934, -0.0016387701034545898, -0.0015733838081359863, -0.0015079975128173828, -0.0014426112174987793, -0.0013772249221801758, -0.0013118386268615723, -0.0012464523315429688, -0.0011810660362243652, -0.0011156797409057617, -0.0010502934455871582, -0.0009849071502685547, -0.0009195208549499512, -0.0008541345596313477, -0.0007887482643127441, -0.0007233619689941406, -0.0006579756736755371, -0.0005925893783569336, -0.0005272030830383301, -0.00046181678771972656, -0.00039643049240112305, -0.00033104419708251953, -0.000265657901763916, -0.0002002716064453125, -0.00013488531112670898, -6.949901580810547e-05, -4.112720489501953e-06, 6.127357482910156e-05, 0.00012665987014770508, 0.0001920461654663086, 0.0002574324607849121, 0.0003228187561035156, 0.00038820505142211914, 0.00045359134674072266, 0.0005189776420593262, 0.0005843639373779297, 0.0006497502326965332, 0.0007151365280151367, 0.0007805228233337402, 0.0008459091186523438, 0.0009112954139709473, 0.0009766817092895508, 0.0010420680046081543, 0.0011074542999267578, 0.0011728405952453613, 0.0012382268905639648, 0.0013036131858825684, 0.0013689994812011719, 0.0014343857765197754, 0.001499772071838379, 0.0015651583671569824, 0.001630544662475586, 0.0016959309577941895, 0.001761317253112793, 0.0018267035484313965, 0.00189208984375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 11.0, 17.0, 19.0, 16.0, 30.0, 52.0, 52.0, 82.0, 80.0, 134.0, 243.0, 618.0, 10582.0, 1026347.0, 9007.0, 524.0, 229.0, 145.0, 97.0, 58.0, 55.0, 41.0, 23.0, 22.0, 17.0, 10.0, 7.0, 6.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05224609375, -0.050685882568359375, -0.04912567138671875, -0.047565460205078125, -0.0460052490234375, -0.044445037841796875, -0.04288482666015625, -0.041324615478515625, -0.039764404296875, -0.038204193115234375, -0.03664398193359375, -0.035083770751953125, -0.0335235595703125, -0.031963348388671875, -0.03040313720703125, -0.028842926025390625, -0.02728271484375, -0.025722503662109375, -0.02416229248046875, -0.022602081298828125, -0.0210418701171875, -0.019481658935546875, -0.01792144775390625, -0.016361236572265625, -0.014801025390625, -0.013240814208984375, -0.01168060302734375, -0.010120391845703125, -0.0085601806640625, -0.006999969482421875, -0.00543975830078125, -0.003879547119140625, -0.0023193359375, -0.000759124755859375, 0.00080108642578125, 0.002361297607421875, 0.0039215087890625, 0.005481719970703125, 0.00704193115234375, 0.008602142333984375, 0.010162353515625, 0.011722564697265625, 0.01328277587890625, 0.014842987060546875, 0.0164031982421875, 0.017963409423828125, 0.01952362060546875, 0.021083831787109375, 0.02264404296875, 0.024204254150390625, 0.02576446533203125, 0.027324676513671875, 0.0288848876953125, 0.030445098876953125, 0.03200531005859375, 0.033565521240234375, 0.035125732421875, 0.036685943603515625, 0.03824615478515625, 0.039806365966796875, 0.0413665771484375, 0.042926788330078125, 0.04448699951171875, 0.046047210693359375, 0.047607421875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 18.0, 34.0, 96.0, 187.0, 239.0, 222.0, 125.0, 58.0, 14.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004594548139721155, -0.0045001995749771595, -0.004405851010233164, -0.0043115029111504555, -0.00421715434640646, -0.004122805781662464, -0.0040284572169184685, -0.003934108652174473, -0.003839760320261121, -0.003745411755517125, -0.003651063423603773, -0.0035567148588597775, -0.0034623665269464254, -0.0033680179622024298, -0.0032736696302890778, -0.003179321065545082, -0.0030849725008010864, -0.0029906239360570908, -0.0028962756041437387, -0.002801927039399743, -0.002707578707486391, -0.0026132301427423954, -0.0025188815779983997, -0.0024245332460850477, -0.0023301849141716957, -0.0022358363494277, -0.002141488017514348, -0.0020471394527703524, -0.0019527910044416785, -0.0018584425561130047, -0.0017640941077843308, -0.001669745659455657, -0.0015753972111269832, -0.0014810487627983093, -0.0013867003144696355, -0.0012923518661409616, -0.001198003301396966, -0.0011036548530682921, -0.0010093064047396183, -0.0009149578982032835, -0.0008206094498746097, -0.0007262610015459359, -0.0006319124950096011, -0.0005375640466809273, -0.000443215569248423, -0.0003488670918159187, -0.00025451864348724484, -0.0001601701369509101, -6.582168862223625e-05, 2.852678153431043e-05, 0.0001228752516908571, 0.00021722371457144618, 0.0003115721920039505, 0.0004059206694364548, 0.0005002691177651286, 0.0005946176243014634, 0.0006889660726301372, 0.000783314520958811, 0.0008776630274951458, 0.0009720114758238196, 0.0010663599241524935, 0.0011607084888964891, 0.0012550568208098412, 0.0013494053855538368, 0.0014437538338825107]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 5.0, 9.0, 10.0, 14.0, 16.0, 18.0, 21.0, 23.0, 25.0, 28.0, 25.0, 39.0, 48.0, 38.0, 42.0, 39.0, 40.0, 40.0, 35.0, 40.0, 35.0, 42.0, 39.0, 38.0, 40.0, 31.0, 36.0, 32.0, 22.0, 17.0, 15.0, 23.0, 23.0, 7.0, 9.0, 10.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009667873382568359, -0.0009367233142256737, -0.0009066592901945114, -0.0008765952661633492, -0.0008465312421321869, -0.0008164672181010246, -0.0007864031940698624, -0.0007563391700387001, -0.0007262751460075378, -0.0006962111219763756, -0.0006661470979452133, -0.0006360830739140511, -0.0006060190498828888, -0.0005759550258517265, -0.0005458910018205643, -0.000515826977789402, -0.00048576295375823975, -0.0004556989297270775, -0.0004256349056959152, -0.00039557088166475296, -0.0003655068576335907, -0.00033544283360242844, -0.0003053788095712662, -0.0002753147855401039, -0.00024525076150894165, -0.0002151867374777794, -0.00018512271344661713, -0.00015505868941545486, -0.0001249946653842926, -9.493064135313034e-05, -6.486661732196808e-05, -3.480259329080582e-05, -4.738569259643555e-06, 2.5325454771518707e-05, 5.538947880268097e-05, 8.545350283384323e-05, 0.00011551752686500549, 0.00014558155089616776, 0.00017564557492733002, 0.00020570959895849228, 0.00023577362298965454, 0.0002658376470208168, 0.00029590167105197906, 0.0003259656950831413, 0.0003560297191143036, 0.00038609374314546585, 0.0004161577671766281, 0.0004462217912077904, 0.00047628581523895264, 0.0005063498392701149, 0.0005364138633012772, 0.0005664778873324394, 0.0005965419113636017, 0.000626605935394764, 0.0006566699594259262, 0.0006867339834570885, 0.0007167980074882507, 0.000746862031519413, 0.0007769260555505753, 0.0008069900795817375, 0.0008370541036128998, 0.000867118127644062, 0.0008971821516752243, 0.0009272461757063866, 0.0009573101997375488]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 6.0, 13.0, 13.0, 14.0, 13.0, 23.0, 21.0, 23.0, 20.0, 28.0, 42.0, 33.0, 27.0, 40.0, 25.0, 33.0, 48.0, 40.0, 46.0, 30.0, 38.0, 40.0, 36.0, 31.0, 36.0, 23.0, 28.0, 28.0, 26.0, 14.0, 18.0, 25.0, 13.0, 16.0, 18.0, 15.0, 12.0, 10.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.2578125, -5.0916748046875, -4.925537109375, -4.7593994140625, -4.59326171875, -4.4271240234375, -4.260986328125, -4.0948486328125, -3.9287109375, -3.7625732421875, -3.596435546875, -3.4302978515625, -3.26416015625, -3.0980224609375, -2.931884765625, -2.7657470703125, -2.599609375, -2.4334716796875, -2.267333984375, -2.1011962890625, -1.93505859375, -1.7689208984375, -1.602783203125, -1.4366455078125, -1.2705078125, -1.1043701171875, -0.938232421875, -0.7720947265625, -0.60595703125, -0.4398193359375, -0.273681640625, -0.1075439453125, 0.05859375, 0.2247314453125, 0.390869140625, 0.5570068359375, 0.72314453125, 0.8892822265625, 1.055419921875, 1.2215576171875, 1.3876953125, 1.5538330078125, 1.719970703125, 1.8861083984375, 2.05224609375, 2.2183837890625, 2.384521484375, 2.5506591796875, 2.716796875, 2.8829345703125, 3.049072265625, 3.2152099609375, 3.38134765625, 3.5474853515625, 3.713623046875, 3.8797607421875, 4.0458984375, 4.2120361328125, 4.378173828125, 4.5443115234375, 4.71044921875, 4.8765869140625, 5.042724609375, 5.2088623046875, 5.375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 13.0, 11.0, 17.0, 18.0, 20.0, 25.0, 42.0, 46.0, 75.0, 78.0, 112.0, 168.0, 220.0, 334.0, 583.0, 992.0, 2986.0, 15867.0, 120079.0, 753048.0, 130858.0, 16948.0, 3156.0, 1088.0, 598.0, 318.0, 211.0, 158.0, 101.0, 83.0, 59.0, 51.0, 43.0, 23.0, 28.0, 24.0, 15.0, 16.0, 10.0, 7.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.734375, -9.425537109375, -9.11669921875, -8.807861328125, -8.4990234375, -8.190185546875, -7.88134765625, -7.572509765625, -7.263671875, -6.954833984375, -6.64599609375, -6.337158203125, -6.0283203125, -5.719482421875, -5.41064453125, -5.101806640625, -4.79296875, -4.484130859375, -4.17529296875, -3.866455078125, -3.5576171875, -3.248779296875, -2.93994140625, -2.631103515625, -2.322265625, -2.013427734375, -1.70458984375, -1.395751953125, -1.0869140625, -0.778076171875, -0.46923828125, -0.160400390625, 0.1484375, 0.457275390625, 0.76611328125, 1.074951171875, 1.3837890625, 1.692626953125, 2.00146484375, 2.310302734375, 2.619140625, 2.927978515625, 3.23681640625, 3.545654296875, 3.8544921875, 4.163330078125, 4.47216796875, 4.781005859375, 5.08984375, 5.398681640625, 5.70751953125, 6.016357421875, 6.3251953125, 6.634033203125, 6.94287109375, 7.251708984375, 7.560546875, 7.869384765625, 8.17822265625, 8.487060546875, 8.7958984375, 9.104736328125, 9.41357421875, 9.722412109375, 10.03125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 5.0, 4.0, 10.0, 11.0, 9.0, 7.0, 12.0, 8.0, 18.0, 18.0, 25.0, 29.0, 34.0, 27.0, 24.0, 37.0, 46.0, 45.0, 50.0, 67.0, 214.0, 1698.0, 154.0, 76.0, 47.0, 45.0, 41.0, 29.0, 24.0, 34.0, 28.0, 26.0, 21.0, 19.0, 16.0, 12.0, 12.0, 11.0, 10.0, 9.0, 12.0, 9.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.828125, -15.307373046875, -14.78662109375, -14.265869140625, -13.7451171875, -13.224365234375, -12.70361328125, -12.182861328125, -11.662109375, -11.141357421875, -10.62060546875, -10.099853515625, -9.5791015625, -9.058349609375, -8.53759765625, -8.016845703125, -7.49609375, -6.975341796875, -6.45458984375, -5.933837890625, -5.4130859375, -4.892333984375, -4.37158203125, -3.850830078125, -3.330078125, -2.809326171875, -2.28857421875, -1.767822265625, -1.2470703125, -0.726318359375, -0.20556640625, 0.315185546875, 0.8359375, 1.356689453125, 1.87744140625, 2.398193359375, 2.9189453125, 3.439697265625, 3.96044921875, 4.481201171875, 5.001953125, 5.522705078125, 6.04345703125, 6.564208984375, 7.0849609375, 7.605712890625, 8.12646484375, 8.647216796875, 9.16796875, 9.688720703125, 10.20947265625, 10.730224609375, 11.2509765625, 11.771728515625, 12.29248046875, 12.813232421875, 13.333984375, 13.854736328125, 14.37548828125, 14.896240234375, 15.4169921875, 15.937744140625, 16.45849609375, 16.979248046875, 17.5]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 4.0, 14.0, 13.0, 10.0, 17.0, 16.0, 20.0, 19.0, 28.0, 35.0, 43.0, 41.0, 70.0, 87.0, 121.0, 204.0, 388.0, 926.0, 23779.0, 3112229.0, 5998.0, 656.0, 282.0, 187.0, 121.0, 79.0, 49.0, 50.0, 47.0, 30.0, 23.0, 19.0, 14.0, 13.0, 8.0, 10.0, 8.0, 14.0, 4.0, 6.0, 2.0, 3.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-52.5, -50.8779296875, -49.255859375, -47.6337890625, -46.01171875, -44.3896484375, -42.767578125, -41.1455078125, -39.5234375, -37.9013671875, -36.279296875, -34.6572265625, -33.03515625, -31.4130859375, -29.791015625, -28.1689453125, -26.546875, -24.9248046875, -23.302734375, -21.6806640625, -20.05859375, -18.4365234375, -16.814453125, -15.1923828125, -13.5703125, -11.9482421875, -10.326171875, -8.7041015625, -7.08203125, -5.4599609375, -3.837890625, -2.2158203125, -0.59375, 1.0283203125, 2.650390625, 4.2724609375, 5.89453125, 7.5166015625, 9.138671875, 10.7607421875, 12.3828125, 14.0048828125, 15.626953125, 17.2490234375, 18.87109375, 20.4931640625, 22.115234375, 23.7373046875, 25.359375, 26.9814453125, 28.603515625, 30.2255859375, 31.84765625, 33.4697265625, 35.091796875, 36.7138671875, 38.3359375, 39.9580078125, 41.580078125, 43.2021484375, 44.82421875, 46.4462890625, 48.068359375, 49.6904296875, 51.3125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 47.0, 208.0, 376.0, 272.0, 86.0, 15.0, 3.0], "bins": [-83.17974853515625, -81.78570556640625, -80.39166259765625, -78.99762725830078, -77.60358428955078, -76.20954132080078, -74.81549835205078, -73.42146301269531, -72.02742004394531, -70.63337707519531, -69.23933410644531, -67.84529876708984, -66.45125579833984, -65.05721282958984, -63.66317367553711, -62.26913070678711, -60.875091552734375, -59.481048583984375, -58.08700942993164, -56.69296646118164, -55.298927307128906, -53.904884338378906, -52.51084518432617, -51.11680221557617, -49.72275924682617, -48.32871627807617, -46.93467712402344, -45.54063415527344, -44.1465950012207, -42.7525520324707, -41.35851287841797, -39.96446990966797, -38.570430755615234, -37.176387786865234, -35.7823486328125, -34.3883056640625, -32.994266510009766, -31.6002254486084, -30.20618438720703, -28.81214141845703, -27.418100357055664, -26.024059295654297, -24.63001823425293, -23.235977172851562, -21.841936111450195, -20.447895050048828, -19.053852081298828, -17.659812927246094, -16.265769958496094, -14.871728897094727, -13.47768783569336, -12.083646774291992, -10.689605712890625, -9.295564651489258, -7.901522636413574, -6.507481575012207, -5.113441467285156, -3.719400405883789, -2.3253591060638428, -0.9313178062438965, 0.4627232551574707, 1.856764316558838, 3.2508058547973633, 4.6448469161987305, 6.038887977600098]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 4.0, 7.0, 4.0, 7.0, 6.0, 13.0, 14.0, 8.0, 14.0, 12.0, 16.0, 21.0, 21.0, 26.0, 30.0, 25.0, 23.0, 25.0, 24.0, 34.0, 37.0, 32.0, 35.0, 49.0, 50.0, 35.0, 27.0, 38.0, 29.0, 26.0, 22.0, 27.0, 29.0, 31.0, 24.0, 24.0, 18.0, 27.0, 18.0, 18.0, 20.0, 9.0, 9.0, 8.0, 6.0, 11.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-46.25877380371094, -44.89012145996094, -43.52146911621094, -42.15281677246094, -40.78416061401367, -39.41550827026367, -38.04685592651367, -36.67820358276367, -35.309547424316406, -33.940895080566406, -32.572242736816406, -31.203588485717773, -29.83493423461914, -28.46628189086914, -27.09762954711914, -25.72897720336914, -24.36032485961914, -22.99167251586914, -21.623018264770508, -20.254365921020508, -18.885711669921875, -17.517059326171875, -16.148406982421875, -14.779753684997559, -13.411100387573242, -12.042447090148926, -10.67379379272461, -9.30514144897461, -7.936488151550293, -6.567834854125977, -5.199182510375977, -3.83052921295166, -2.461872100830078, -1.0932190418243408, 0.2754340171813965, 1.6440868377685547, 3.012740135192871, 4.3813934326171875, 5.7500457763671875, 7.118699073791504, 8.48735237121582, 9.856005668640137, 11.224658966064453, 12.593311309814453, 13.96196460723877, 15.330617904663086, 16.699270248413086, 18.06792449951172, 19.43657684326172, 20.80522918701172, 22.17388343811035, 23.54253578186035, 24.911190032958984, 26.279842376708984, 27.648494720458984, 29.017147064208984, 30.385801315307617, 31.754453659057617, 33.12310791015625, 34.49176025390625, 35.86041259765625, 37.22906494140625, 38.59771728515625, 39.966373443603516, 41.335025787353516]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 6.0, 9.0, 7.0, 15.0, 11.0, 18.0, 18.0, 24.0, 19.0, 27.0, 31.0, 23.0, 32.0, 32.0, 33.0, 35.0, 38.0, 37.0, 37.0, 45.0, 47.0, 49.0, 34.0, 29.0, 37.0, 31.0, 20.0, 33.0, 20.0, 33.0, 24.0, 15.0, 14.0, 19.0, 20.0, 12.0, 13.0, 16.0, 7.0, 10.0, 2.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.05859375, -5.8802490234375, -5.701904296875, -5.5235595703125, -5.34521484375, -5.1668701171875, -4.988525390625, -4.8101806640625, -4.6318359375, -4.4534912109375, -4.275146484375, -4.0968017578125, -3.91845703125, -3.7401123046875, -3.561767578125, -3.3834228515625, -3.205078125, -3.0267333984375, -2.848388671875, -2.6700439453125, -2.49169921875, -2.3133544921875, -2.135009765625, -1.9566650390625, -1.7783203125, -1.5999755859375, -1.421630859375, -1.2432861328125, -1.06494140625, -0.8865966796875, -0.708251953125, -0.5299072265625, -0.3515625, -0.1732177734375, 0.005126953125, 0.1834716796875, 0.36181640625, 0.5401611328125, 0.718505859375, 0.8968505859375, 1.0751953125, 1.2535400390625, 1.431884765625, 1.6102294921875, 1.78857421875, 1.9669189453125, 2.145263671875, 2.3236083984375, 2.501953125, 2.6802978515625, 2.858642578125, 3.0369873046875, 3.21533203125, 3.3936767578125, 3.572021484375, 3.7503662109375, 3.9287109375, 4.1070556640625, 4.285400390625, 4.4637451171875, 4.64208984375, 4.8204345703125, 4.998779296875, 5.1771240234375, 5.35546875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 7.0, 16.0, 23.0, 29.0, 37.0, 53.0, 83.0, 95.0, 178.0, 320.0, 632.0, 1495.0, 4136.0, 12722.0, 50101.0, 276236.0, 1176925.0, 1796704.0, 703808.0, 128885.0, 28331.0, 8126.0, 2880.0, 1162.0, 532.0, 267.0, 171.0, 87.0, 67.0, 53.0, 40.0, 15.0, 22.0, 19.0, 11.0, 7.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-10.6171875, -10.34698486328125, -10.0767822265625, -9.80657958984375, -9.536376953125, -9.26617431640625, -8.9959716796875, -8.72576904296875, -8.45556640625, -8.18536376953125, -7.9151611328125, -7.64495849609375, -7.374755859375, -7.10455322265625, -6.8343505859375, -6.56414794921875, -6.2939453125, -6.02374267578125, -5.7535400390625, -5.48333740234375, -5.213134765625, -4.94293212890625, -4.6727294921875, -4.40252685546875, -4.13232421875, -3.86212158203125, -3.5919189453125, -3.32171630859375, -3.051513671875, -2.78131103515625, -2.5111083984375, -2.24090576171875, -1.970703125, -1.70050048828125, -1.4302978515625, -1.16009521484375, -0.889892578125, -0.61968994140625, -0.3494873046875, -0.07928466796875, 0.19091796875, 0.46112060546875, 0.7313232421875, 1.00152587890625, 1.271728515625, 1.54193115234375, 1.8121337890625, 2.08233642578125, 2.3525390625, 2.62274169921875, 2.8929443359375, 3.16314697265625, 3.433349609375, 3.70355224609375, 3.9737548828125, 4.24395751953125, 4.51416015625, 4.78436279296875, 5.0545654296875, 5.32476806640625, 5.594970703125, 5.86517333984375, 6.1353759765625, 6.40557861328125, 6.67578125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 8.0, 9.0, 13.0, 18.0, 24.0, 40.0, 36.0, 52.0, 87.0, 103.0, 125.0, 189.0, 214.0, 265.0, 363.0, 384.0, 407.0, 392.0, 318.0, 276.0, 179.0, 123.0, 111.0, 76.0, 57.0, 41.0, 39.0, 27.0, 30.0, 16.0, 15.0, 15.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.46875, -12.1422119140625, -11.815673828125, -11.4891357421875, -11.16259765625, -10.8360595703125, -10.509521484375, -10.1829833984375, -9.8564453125, -9.5299072265625, -9.203369140625, -8.8768310546875, -8.55029296875, -8.2237548828125, -7.897216796875, -7.5706787109375, -7.244140625, -6.9176025390625, -6.591064453125, -6.2645263671875, -5.93798828125, -5.6114501953125, -5.284912109375, -4.9583740234375, -4.6318359375, -4.3052978515625, -3.978759765625, -3.6522216796875, -3.32568359375, -2.9991455078125, -2.672607421875, -2.3460693359375, -2.01953125, -1.6929931640625, -1.366455078125, -1.0399169921875, -0.71337890625, -0.3868408203125, -0.060302734375, 0.2662353515625, 0.5927734375, 0.9193115234375, 1.245849609375, 1.5723876953125, 1.89892578125, 2.2254638671875, 2.552001953125, 2.8785400390625, 3.205078125, 3.5316162109375, 3.858154296875, 4.1846923828125, 4.51123046875, 4.8377685546875, 5.164306640625, 5.4908447265625, 5.8173828125, 6.1439208984375, 6.470458984375, 6.7969970703125, 7.12353515625, 7.4500732421875, 7.776611328125, 8.1031494140625, 8.4296875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 7.0, 13.0, 27.0, 16.0, 36.0, 28.0, 66.0, 75.0, 91.0, 127.0, 139.0, 199.0, 266.0, 384.0, 654.0, 1538.0, 15070.0, 3276531.0, 889409.0, 6631.0, 1026.0, 528.0, 325.0, 277.0, 209.0, 135.0, 102.0, 95.0, 66.0, 49.0, 40.0, 33.0, 25.0, 14.0, 15.0, 12.0, 1.0, 7.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.75, -31.43359375, -30.1171875, -28.80078125, -27.484375, -26.16796875, -24.8515625, -23.53515625, -22.21875, -20.90234375, -19.5859375, -18.26953125, -16.953125, -15.63671875, -14.3203125, -13.00390625, -11.6875, -10.37109375, -9.0546875, -7.73828125, -6.421875, -5.10546875, -3.7890625, -2.47265625, -1.15625, 0.16015625, 1.4765625, 2.79296875, 4.109375, 5.42578125, 6.7421875, 8.05859375, 9.375, 10.69140625, 12.0078125, 13.32421875, 14.640625, 15.95703125, 17.2734375, 18.58984375, 19.90625, 21.22265625, 22.5390625, 23.85546875, 25.171875, 26.48828125, 27.8046875, 29.12109375, 30.4375, 31.75390625, 33.0703125, 34.38671875, 35.703125, 37.01953125, 38.3359375, 39.65234375, 40.96875, 42.28515625, 43.6015625, 44.91796875, 46.234375, 47.55078125, 48.8671875, 50.18359375, 51.5]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 436.0, 532.0, 30.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-486.7415466308594, -477.9002685546875, -469.0589904785156, -460.21771240234375, -451.3764343261719, -442.53515625, -433.6938781738281, -424.85260009765625, -416.0113220214844, -407.1700439453125, -398.3287658691406, -389.48748779296875, -380.6462097167969, -371.804931640625, -362.9636535644531, -354.12237548828125, -345.2811279296875, -336.4398498535156, -327.59857177734375, -318.7572937011719, -309.916015625, -301.0747375488281, -292.23345947265625, -283.3921813964844, -274.5509033203125, -265.7096252441406, -256.86834716796875, -248.02706909179688, -239.185791015625, -230.34451293945312, -221.50323486328125, -212.66195678710938, -203.82070922851562, -194.97943115234375, -186.13815307617188, -177.296875, -168.45559692382812, -159.61431884765625, -150.77304077148438, -141.9317626953125, -133.09048461914062, -124.24920654296875, -115.40792846679688, -106.566650390625, -97.72537231445312, -88.88409423828125, -80.0428237915039, -71.20154571533203, -62.360267639160156, -53.51898956298828, -44.677711486816406, -35.8364372253418, -26.995159149169922, -18.153881072998047, -9.312606811523438, -0.4713287353515625, 8.369949340820312, 17.211227416992188, 26.05250358581543, 34.89377975463867, 43.73505783081055, 52.57633590698242, 61.41761016845703, 70.2588882446289, 79.10016632080078]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 4.0, 8.0, 10.0, 16.0, 12.0, 9.0, 25.0, 17.0, 21.0, 22.0, 21.0, 28.0, 27.0, 47.0, 49.0, 34.0, 56.0, 31.0, 39.0, 32.0, 44.0, 39.0, 43.0, 27.0, 33.0, 33.0, 25.0, 32.0, 21.0, 28.0, 28.0, 14.0, 25.0, 26.0, 11.0, 11.0, 11.0, 6.0, 3.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-36.28489685058594, -35.20779037475586, -34.13068389892578, -33.0535774230957, -31.976472854614258, -30.89936637878418, -29.822261810302734, -28.745155334472656, -27.668048858642578, -26.5909423828125, -25.513835906982422, -24.436731338500977, -23.3596248626709, -22.28251838684082, -21.205413818359375, -20.128307342529297, -19.05120086669922, -17.97409439086914, -16.896987915039062, -15.819883346557617, -14.742776870727539, -13.665670394897461, -12.5885648727417, -11.511459350585938, -10.43435287475586, -9.357246398925781, -8.28014087677002, -7.2030348777771, -6.12592887878418, -5.04882287979126, -3.97171688079834, -2.89461088180542, -1.8175048828125, -0.7403988838195801, 0.33670711517333984, 1.4138131141662598, 2.4909191131591797, 3.5680251121520996, 4.6451311111450195, 5.7222371101379395, 6.799343109130859, 7.876449108123779, 8.9535551071167, 10.030660629272461, 11.107767105102539, 12.184873580932617, 13.261979103088379, 14.33908462524414, 15.416191101074219, 16.493297576904297, 17.570404052734375, 18.64750862121582, 19.7246150970459, 20.801721572875977, 21.878826141357422, 22.9559326171875, 24.033039093017578, 25.110145568847656, 26.187252044677734, 27.26435661315918, 28.341463088989258, 29.418569564819336, 30.49567413330078, 31.57278060913086, 32.64988708496094]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 7.0, 9.0, 8.0, 8.0, 13.0, 14.0, 12.0, 13.0, 13.0, 18.0, 13.0, 24.0, 26.0, 39.0, 17.0, 31.0, 24.0, 28.0, 33.0, 48.0, 36.0, 34.0, 43.0, 37.0, 32.0, 34.0, 27.0, 31.0, 32.0, 28.0, 36.0, 23.0, 23.0, 19.0, 21.0, 18.0, 18.0, 15.0, 19.0, 15.0, 13.0, 13.0, 9.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-5.20703125, -5.04876708984375, -4.8905029296875, -4.73223876953125, -4.573974609375, -4.41571044921875, -4.2574462890625, -4.09918212890625, -3.94091796875, -3.78265380859375, -3.6243896484375, -3.46612548828125, -3.307861328125, -3.14959716796875, -2.9913330078125, -2.83306884765625, -2.6748046875, -2.51654052734375, -2.3582763671875, -2.20001220703125, -2.041748046875, -1.88348388671875, -1.7252197265625, -1.56695556640625, -1.40869140625, -1.25042724609375, -1.0921630859375, -0.93389892578125, -0.775634765625, -0.61737060546875, -0.4591064453125, -0.30084228515625, -0.142578125, 0.01568603515625, 0.1739501953125, 0.33221435546875, 0.490478515625, 0.64874267578125, 0.8070068359375, 0.96527099609375, 1.12353515625, 1.28179931640625, 1.4400634765625, 1.59832763671875, 1.756591796875, 1.91485595703125, 2.0731201171875, 2.23138427734375, 2.3896484375, 2.54791259765625, 2.7061767578125, 2.86444091796875, 3.022705078125, 3.18096923828125, 3.3392333984375, 3.49749755859375, 3.65576171875, 3.81402587890625, 3.9722900390625, 4.13055419921875, 4.288818359375, 4.44708251953125, 4.6053466796875, 4.76361083984375, 4.921875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 7.0, 10.0, 29.0, 37.0, 41.0, 45.0, 89.0, 112.0, 187.0, 258.0, 423.0, 654.0, 866.0, 1303.0, 1878.0, 2717.0, 4190.0, 6313.0, 9689.0, 15092.0, 23952.0, 39169.0, 66442.0, 116878.0, 198392.0, 218805.0, 139022.0, 78785.0, 45588.0, 27660.0, 17194.0, 11044.0, 7196.0, 4774.0, 3161.0, 2106.0, 1414.0, 978.0, 672.0, 445.0, 296.0, 197.0, 143.0, 93.0, 79.0, 37.0, 27.0, 25.0, 20.0, 7.0, 4.0, 2.0, 7.0, 2.0, 3.0, 1.0], "bins": [-0.767578125, -0.7444229125976562, -0.7212677001953125, -0.6981124877929688, -0.674957275390625, -0.6518020629882812, -0.6286468505859375, -0.6054916381835938, -0.58233642578125, -0.5591812133789062, -0.5360260009765625, -0.5128707885742188, -0.489715576171875, -0.46656036376953125, -0.4434051513671875, -0.42024993896484375, -0.3970947265625, -0.37393951416015625, -0.3507843017578125, -0.32762908935546875, -0.304473876953125, -0.28131866455078125, -0.2581634521484375, -0.23500823974609375, -0.21185302734375, -0.18869781494140625, -0.1655426025390625, -0.14238739013671875, -0.119232177734375, -0.09607696533203125, -0.0729217529296875, -0.04976654052734375, -0.026611328125, -0.00345611572265625, 0.0196990966796875, 0.04285430908203125, 0.066009521484375, 0.08916473388671875, 0.1123199462890625, 0.13547515869140625, 0.15863037109375, 0.18178558349609375, 0.2049407958984375, 0.22809600830078125, 0.251251220703125, 0.27440643310546875, 0.2975616455078125, 0.32071685791015625, 0.3438720703125, 0.36702728271484375, 0.3901824951171875, 0.41333770751953125, 0.436492919921875, 0.45964813232421875, 0.4828033447265625, 0.5059585571289062, 0.52911376953125, 0.5522689819335938, 0.5754241943359375, 0.5985794067382812, 0.621734619140625, 0.6448898315429688, 0.6680450439453125, 0.6912002563476562, 0.71435546875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 9.0, 8.0, 17.0, 10.0, 24.0, 14.0, 21.0, 29.0, 17.0, 20.0, 31.0, 39.0, 30.0, 45.0, 46.0, 42.0, 49.0, 37.0, 1068.0, 42.0, 36.0, 31.0, 46.0, 30.0, 36.0, 35.0, 32.0, 29.0, 22.0, 12.0, 18.0, 13.0, 12.0, 19.0, 13.0, 7.0, 6.0, 11.0, 1.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.486328125, -3.363861083984375, -3.24139404296875, -3.118927001953125, -2.9964599609375, -2.873992919921875, -2.75152587890625, -2.629058837890625, -2.506591796875, -2.384124755859375, -2.26165771484375, -2.139190673828125, -2.0167236328125, -1.894256591796875, -1.77178955078125, -1.649322509765625, -1.52685546875, -1.404388427734375, -1.28192138671875, -1.159454345703125, -1.0369873046875, -0.914520263671875, -0.79205322265625, -0.669586181640625, -0.547119140625, -0.424652099609375, -0.30218505859375, -0.179718017578125, -0.0572509765625, 0.065216064453125, 0.18768310546875, 0.310150146484375, 0.4326171875, 0.555084228515625, 0.67755126953125, 0.800018310546875, 0.9224853515625, 1.044952392578125, 1.16741943359375, 1.289886474609375, 1.412353515625, 1.534820556640625, 1.65728759765625, 1.779754638671875, 1.9022216796875, 2.024688720703125, 2.14715576171875, 2.269622802734375, 2.39208984375, 2.514556884765625, 2.63702392578125, 2.759490966796875, 2.8819580078125, 3.004425048828125, 3.12689208984375, 3.249359130859375, 3.371826171875, 3.494293212890625, 3.61676025390625, 3.739227294921875, 3.8616943359375, 3.984161376953125, 4.10662841796875, 4.229095458984375, 4.3515625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 10.0, 18.0, 27.0, 51.0, 87.0, 129.0, 194.0, 329.0, 579.0, 996.0, 1629.0, 2829.0, 4889.0, 8850.0, 15937.0, 29633.0, 55331.0, 107766.0, 200992.0, 1304456.0, 172160.0, 88494.0, 46477.0, 24829.0, 13304.0, 7356.0, 4132.0, 2327.0, 1300.0, 762.0, 462.0, 279.0, 173.0, 111.0, 71.0, 46.0, 37.0, 18.0, 15.0, 18.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.84716796875, -0.8238677978515625, -0.800567626953125, -0.7772674560546875, -0.75396728515625, -0.7306671142578125, -0.707366943359375, -0.6840667724609375, -0.6607666015625, -0.6374664306640625, -0.614166259765625, -0.5908660888671875, -0.56756591796875, -0.5442657470703125, -0.520965576171875, -0.4976654052734375, -0.474365234375, -0.4510650634765625, -0.427764892578125, -0.4044647216796875, -0.38116455078125, -0.3578643798828125, -0.334564208984375, -0.3112640380859375, -0.2879638671875, -0.2646636962890625, -0.241363525390625, -0.2180633544921875, -0.19476318359375, -0.1714630126953125, -0.148162841796875, -0.1248626708984375, -0.1015625, -0.0782623291015625, -0.054962158203125, -0.0316619873046875, -0.00836181640625, 0.0149383544921875, 0.038238525390625, 0.0615386962890625, 0.0848388671875, 0.1081390380859375, 0.131439208984375, 0.1547393798828125, 0.17803955078125, 0.2013397216796875, 0.224639892578125, 0.2479400634765625, 0.271240234375, 0.2945404052734375, 0.317840576171875, 0.3411407470703125, 0.36444091796875, 0.3877410888671875, 0.411041259765625, 0.4343414306640625, 0.4576416015625, 0.4809417724609375, 0.504241943359375, 0.5275421142578125, 0.55084228515625, 0.5741424560546875, 0.597442626953125, 0.6207427978515625, 0.64404296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 17.0, 17.0, 20.0, 18.0, 29.0, 21.0, 34.0, 43.0, 50.0, 58.0, 74.0, 74.0, 53.0, 67.0, 69.0, 48.0, 49.0, 37.0, 48.0, 26.0, 20.0, 27.0, 21.0, 15.0, 8.0, 11.0, 8.0, 3.0, 3.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.002773284912109375, -0.002696692943572998, -0.002620100975036621, -0.002543509006500244, -0.002466917037963867, -0.0023903250694274902, -0.0023137331008911133, -0.0022371411323547363, -0.0021605491638183594, -0.0020839571952819824, -0.0020073652267456055, -0.0019307732582092285, -0.0018541812896728516, -0.0017775893211364746, -0.0017009973526000977, -0.0016244053840637207, -0.0015478134155273438, -0.0014712214469909668, -0.0013946294784545898, -0.0013180375099182129, -0.001241445541381836, -0.001164853572845459, -0.001088261604309082, -0.001011669635772705, -0.0009350776672363281, -0.0008584856986999512, -0.0007818937301635742, -0.0007053017616271973, -0.0006287097930908203, -0.0005521178245544434, -0.0004755258560180664, -0.00039893388748168945, -0.0003223419189453125, -0.00024574995040893555, -0.0001691579818725586, -9.256601333618164e-05, -1.5974044799804688e-05, 6.0617923736572266e-05, 0.00013720989227294922, 0.00021380186080932617, 0.0002903938293457031, 0.0003669857978820801, 0.00044357776641845703, 0.000520169734954834, 0.0005967617034912109, 0.0006733536720275879, 0.0007499456405639648, 0.0008265376091003418, 0.0009031295776367188, 0.0009797215461730957, 0.0010563135147094727, 0.0011329054832458496, 0.0012094974517822266, 0.0012860894203186035, 0.0013626813888549805, 0.0014392733573913574, 0.0015158653259277344, 0.0015924572944641113, 0.0016690492630004883, 0.0017456412315368652, 0.0018222332000732422, 0.0018988251686096191, 0.001975417137145996, 0.002052009105682373, 0.00212860107421875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 2.0, 1.0, 3.0, 8.0, 7.0, 11.0, 13.0, 17.0, 19.0, 24.0, 47.0, 56.0, 81.0, 77.0, 124.0, 194.0, 511.0, 2013.0, 1008521.0, 35279.0, 748.0, 278.0, 153.0, 89.0, 59.0, 52.0, 36.0, 36.0, 28.0, 18.0, 16.0, 4.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05291748046875, -0.05107593536376953, -0.04923439025878906, -0.047392845153808594, -0.045551300048828125, -0.043709754943847656, -0.04186820983886719, -0.04002666473388672, -0.03818511962890625, -0.03634357452392578, -0.03450202941894531, -0.032660484313964844, -0.030818939208984375, -0.028977394104003906, -0.027135848999023438, -0.02529430389404297, -0.0234527587890625, -0.02161121368408203, -0.019769668579101562, -0.017928123474121094, -0.016086578369140625, -0.014245033264160156, -0.012403488159179688, -0.010561943054199219, -0.00872039794921875, -0.006878852844238281, -0.0050373077392578125, -0.0031957626342773438, -0.001354217529296875, 0.00048732757568359375, 0.0023288726806640625, 0.004170417785644531, 0.006011962890625, 0.007853507995605469, 0.009695053100585938, 0.011536598205566406, 0.013378143310546875, 0.015219688415527344, 0.017061233520507812, 0.01890277862548828, 0.02074432373046875, 0.02258586883544922, 0.024427413940429688, 0.026268959045410156, 0.028110504150390625, 0.029952049255371094, 0.03179359436035156, 0.03363513946533203, 0.0354766845703125, 0.03731822967529297, 0.03915977478027344, 0.041001319885253906, 0.042842864990234375, 0.044684410095214844, 0.04652595520019531, 0.04836750030517578, 0.05020904541015625, 0.05205059051513672, 0.05389213562011719, 0.055733680725097656, 0.057575225830078125, 0.059416770935058594, 0.06125831604003906, 0.06309986114501953, 0.06494140625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 24.0, 98.0, 347.0, 360.0, 142.0, 34.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027707030531018972, -0.0026084640994668007, -0.0024462249130010605, -0.0022839857265353203, -0.0021217467729002237, -0.001959507819265127, -0.001797268632799387, -0.0016350295627489686, -0.0014727904926985502, -0.0013105514226481318, -0.0011483123525977135, -0.000986073282547295, -0.0008238342124968767, -0.0006615951424464583, -0.00049935607239604, -0.0003371170023456216, -0.0001748779322952032, -1.2638862244784832e-05, 0.00014960020780563354, 0.0003118392778560519, 0.0004740783479064703, 0.0006363174179568887, 0.000798556488007307, 0.0009607955580577254, 0.0011230346281081438, 0.0012852736981585622, 0.0014475127682089806, 0.001609751838259399, 0.0017719909083098173, 0.0019342299783602357, 0.002096469048410654, 0.0022587082348763943, 0.0024209474213421345, 0.0025831866078078747, 0.0027454255614429712, 0.0029076645150780678, 0.003069903701543808, 0.003232142888009548, 0.0033943818416446447, 0.0035566207952797413, 0.0037188599817454815, 0.0038810991682112217, 0.004043337889015675, 0.004205577075481415, 0.004367816261947155, 0.004530055448412895, 0.004692294634878635, 0.004854533355683088, 0.0050167725421488285, 0.005179011728614569, 0.005341250449419022, 0.005503489635884762, 0.005665728822350502, 0.005827968008816242, 0.005990207195281982, 0.006152445916086435, 0.0063146851025521755, 0.006476924289017916, 0.006639163009822369, 0.006801402196288109, 0.006963641382753849, 0.007125880569219589, 0.0072881197556853294, 0.007450358476489782, 0.0076125976629555225]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 10.0, 16.0, 6.0, 14.0, 15.0, 14.0, 17.0, 25.0, 30.0, 27.0, 31.0, 31.0, 32.0, 38.0, 38.0, 31.0, 39.0, 28.0, 25.0, 45.0, 37.0, 37.0, 43.0, 31.0, 37.0, 24.0, 43.0, 36.0, 25.0, 29.0, 24.0, 15.0, 16.0, 20.0, 10.0, 13.0, 7.0, 7.0, 9.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.001285254955291748, -0.0012497790157794952, -0.0012143030762672424, -0.0011788271367549896, -0.0011433511972427368, -0.001107875257730484, -0.0010723993182182312, -0.0010369233787059784, -0.0010014474391937256, -0.0009659714996814728, -0.00093049556016922, -0.0008950196206569672, -0.0008595436811447144, -0.0008240677416324615, -0.0007885918021202087, -0.0007531158626079559, -0.0007176399230957031, -0.0006821639835834503, -0.0006466880440711975, -0.0006112121045589447, -0.0005757361650466919, -0.0005402602255344391, -0.0005047842860221863, -0.00046930834650993347, -0.00043383240699768066, -0.00039835646748542786, -0.00036288052797317505, -0.00032740458846092224, -0.00029192864894866943, -0.0002564527094364166, -0.00022097676992416382, -0.000185500830411911, -0.0001500248908996582, -0.0001145489513874054, -7.907301187515259e-05, -4.359707236289978e-05, -8.121132850646973e-06, 2.7354806661605835e-05, 6.283074617385864e-05, 9.830668568611145e-05, 0.00013378262519836426, 0.00016925856471061707, 0.00020473450422286987, 0.00024021044373512268, 0.0002756863832473755, 0.0003111623227596283, 0.0003466382622718811, 0.0003821142017841339, 0.0004175901412963867, 0.0004530660808086395, 0.0004885420203208923, 0.0005240179598331451, 0.000559493899345398, 0.0005949698388576508, 0.0006304457783699036, 0.0006659217178821564, 0.0007013976573944092, 0.000736873596906662, 0.0007723495364189148, 0.0008078254759311676, 0.0008433014154434204, 0.0008787773549556732, 0.000914253294467926, 0.0009497292339801788, 0.0009852051734924316]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 7.0, 9.0, 8.0, 8.0, 13.0, 14.0, 12.0, 13.0, 13.0, 18.0, 13.0, 24.0, 26.0, 39.0, 17.0, 31.0, 24.0, 28.0, 33.0, 48.0, 36.0, 34.0, 43.0, 37.0, 32.0, 34.0, 27.0, 31.0, 32.0, 28.0, 36.0, 23.0, 23.0, 19.0, 21.0, 18.0, 18.0, 15.0, 19.0, 15.0, 13.0, 13.0, 9.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-5.20703125, -5.04876708984375, -4.8905029296875, -4.73223876953125, -4.573974609375, -4.41571044921875, -4.2574462890625, -4.09918212890625, -3.94091796875, -3.78265380859375, -3.6243896484375, -3.46612548828125, -3.307861328125, -3.14959716796875, -2.9913330078125, -2.83306884765625, -2.6748046875, -2.51654052734375, -2.3582763671875, -2.20001220703125, -2.041748046875, -1.88348388671875, -1.7252197265625, -1.56695556640625, -1.40869140625, -1.25042724609375, -1.0921630859375, -0.93389892578125, -0.775634765625, -0.61737060546875, -0.4591064453125, -0.30084228515625, -0.142578125, 0.01568603515625, 0.1739501953125, 0.33221435546875, 0.490478515625, 0.64874267578125, 0.8070068359375, 0.96527099609375, 1.12353515625, 1.28179931640625, 1.4400634765625, 1.59832763671875, 1.756591796875, 1.91485595703125, 2.0731201171875, 2.23138427734375, 2.3896484375, 2.54791259765625, 2.7061767578125, 2.86444091796875, 3.022705078125, 3.18096923828125, 3.3392333984375, 3.49749755859375, 3.65576171875, 3.81402587890625, 3.9722900390625, 4.13055419921875, 4.288818359375, 4.44708251953125, 4.6053466796875, 4.76361083984375, 4.921875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 2.0, 9.0, 7.0, 6.0, 16.0, 19.0, 20.0, 26.0, 26.0, 30.0, 45.0, 73.0, 104.0, 196.0, 358.0, 712.0, 1455.0, 3194.0, 7179.0, 16085.0, 35281.0, 81149.0, 217841.0, 391580.0, 171807.0, 66966.0, 29733.0, 13318.0, 5899.0, 2730.0, 1238.0, 586.0, 303.0, 165.0, 113.0, 71.0, 40.0, 30.0, 39.0, 10.0, 24.0, 12.0, 11.0, 16.0, 4.0, 8.0, 6.0, 4.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.890625, -4.7396240234375, -4.588623046875, -4.4376220703125, -4.28662109375, -4.1356201171875, -3.984619140625, -3.8336181640625, -3.6826171875, -3.5316162109375, -3.380615234375, -3.2296142578125, -3.07861328125, -2.9276123046875, -2.776611328125, -2.6256103515625, -2.474609375, -2.3236083984375, -2.172607421875, -2.0216064453125, -1.87060546875, -1.7196044921875, -1.568603515625, -1.4176025390625, -1.2666015625, -1.1156005859375, -0.964599609375, -0.8135986328125, -0.66259765625, -0.5115966796875, -0.360595703125, -0.2095947265625, -0.05859375, 0.0924072265625, 0.243408203125, 0.3944091796875, 0.54541015625, 0.6964111328125, 0.847412109375, 0.9984130859375, 1.1494140625, 1.3004150390625, 1.451416015625, 1.6024169921875, 1.75341796875, 1.9044189453125, 2.055419921875, 2.2064208984375, 2.357421875, 2.5084228515625, 2.659423828125, 2.8104248046875, 2.96142578125, 3.1124267578125, 3.263427734375, 3.4144287109375, 3.5654296875, 3.7164306640625, 3.867431640625, 4.0184326171875, 4.16943359375, 4.3204345703125, 4.471435546875, 4.6224365234375, 4.7734375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 8.0, 3.0, 5.0, 12.0, 10.0, 16.0, 15.0, 22.0, 14.0, 23.0, 29.0, 19.0, 33.0, 30.0, 37.0, 48.0, 56.0, 64.0, 134.0, 1480.0, 392.0, 112.0, 65.0, 51.0, 46.0, 32.0, 34.0, 31.0, 21.0, 22.0, 31.0, 29.0, 15.0, 19.0, 15.0, 19.0, 8.0, 5.0, 9.0, 11.0, 7.0, 5.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.734375, -18.165283203125, -17.59619140625, -17.027099609375, -16.4580078125, -15.888916015625, -15.31982421875, -14.750732421875, -14.181640625, -13.612548828125, -13.04345703125, -12.474365234375, -11.9052734375, -11.336181640625, -10.76708984375, -10.197998046875, -9.62890625, -9.059814453125, -8.49072265625, -7.921630859375, -7.3525390625, -6.783447265625, -6.21435546875, -5.645263671875, -5.076171875, -4.507080078125, -3.93798828125, -3.368896484375, -2.7998046875, -2.230712890625, -1.66162109375, -1.092529296875, -0.5234375, 0.045654296875, 0.61474609375, 1.183837890625, 1.7529296875, 2.322021484375, 2.89111328125, 3.460205078125, 4.029296875, 4.598388671875, 5.16748046875, 5.736572265625, 6.3056640625, 6.874755859375, 7.44384765625, 8.012939453125, 8.58203125, 9.151123046875, 9.72021484375, 10.289306640625, 10.8583984375, 11.427490234375, 11.99658203125, 12.565673828125, 13.134765625, 13.703857421875, 14.27294921875, 14.842041015625, 15.4111328125, 15.980224609375, 16.54931640625, 17.118408203125, 17.6875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 2.0, 5.0, 6.0, 13.0, 11.0, 14.0, 11.0, 24.0, 25.0, 31.0, 50.0, 55.0, 72.0, 76.0, 104.0, 134.0, 180.0, 260.0, 421.0, 911.0, 8723.0, 2652769.0, 475527.0, 4230.0, 795.0, 395.0, 215.0, 156.0, 106.0, 82.0, 65.0, 54.0, 34.0, 32.0, 29.0, 21.0, 13.0, 8.0, 8.0, 11.0, 11.0, 3.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.984375, -30.948974609375, -29.91357421875, -28.878173828125, -27.8427734375, -26.807373046875, -25.77197265625, -24.736572265625, -23.701171875, -22.665771484375, -21.63037109375, -20.594970703125, -19.5595703125, -18.524169921875, -17.48876953125, -16.453369140625, -15.41796875, -14.382568359375, -13.34716796875, -12.311767578125, -11.2763671875, -10.240966796875, -9.20556640625, -8.170166015625, -7.134765625, -6.099365234375, -5.06396484375, -4.028564453125, -2.9931640625, -1.957763671875, -0.92236328125, 0.113037109375, 1.1484375, 2.183837890625, 3.21923828125, 4.254638671875, 5.2900390625, 6.325439453125, 7.36083984375, 8.396240234375, 9.431640625, 10.467041015625, 11.50244140625, 12.537841796875, 13.5732421875, 14.608642578125, 15.64404296875, 16.679443359375, 17.71484375, 18.750244140625, 19.78564453125, 20.821044921875, 21.8564453125, 22.891845703125, 23.92724609375, 24.962646484375, 25.998046875, 27.033447265625, 28.06884765625, 29.104248046875, 30.1396484375, 31.175048828125, 32.21044921875, 33.245849609375, 34.28125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 9.0, 164.0, 597.0, 227.0, 19.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.780529022216797, -10.007795333862305, -7.235060691833496, -4.4623260498046875, -1.6895923614501953, 1.0831413269042969, 3.855876922607422, 6.628610610961914, 9.401344299316406, 12.174077987670898, 14.946812629699707, 17.719547271728516, 20.492280960083008, 23.2650146484375, 26.037750244140625, 28.810483932495117, 31.58321762084961, 34.355953216552734, 37.128684997558594, 39.90142059326172, 42.674156188964844, 45.4468879699707, 48.21962356567383, 50.99235534667969, 53.76509094238281, 56.53782653808594, 59.3105583190918, 62.08329391479492, 64.85602569580078, 67.6287612915039, 70.40149688720703, 73.17423248291016, 75.94696044921875, 78.71969604492188, 81.492431640625, 84.26516723632812, 87.03789520263672, 89.81063079833984, 92.58336639404297, 95.3561019897461, 98.12882995605469, 100.90156555175781, 103.67430114746094, 106.44703674316406, 109.21976470947266, 111.99250030517578, 114.7652359008789, 117.53797149658203, 120.31070709228516, 123.08344268798828, 125.8561782836914, 128.62890625, 131.40164184570312, 134.17437744140625, 136.94711303710938, 139.7198486328125, 142.49258422851562, 145.26531982421875, 148.03805541992188, 150.810791015625, 153.58352661132812, 156.35626220703125, 159.12899780273438, 161.90171813964844, 164.67445373535156]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 5.0, 3.0, 4.0, 6.0, 8.0, 7.0, 13.0, 8.0, 11.0, 12.0, 12.0, 19.0, 19.0, 27.0, 29.0, 31.0, 42.0, 38.0, 39.0, 37.0, 36.0, 39.0, 54.0, 45.0, 42.0, 42.0, 34.0, 30.0, 44.0, 42.0, 32.0, 24.0, 27.0, 21.0, 22.0, 18.0, 14.0, 9.0, 15.0, 12.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-53.05552291870117, -51.49504089355469, -49.93455505371094, -48.37407302856445, -46.81359100341797, -45.253108978271484, -43.692623138427734, -42.13214111328125, -40.571659088134766, -39.01117706298828, -37.45069122314453, -35.89020919799805, -34.32972717285156, -32.76924514770508, -31.208759307861328, -29.648277282714844, -28.087793350219727, -26.52730941772461, -24.966827392578125, -23.406343460083008, -21.845861434936523, -20.285377502441406, -18.724895477294922, -17.164411544799805, -15.603928565979004, -14.043445587158203, -12.482962608337402, -10.922479629516602, -9.361995697021484, -7.801513195037842, -6.241029739379883, -4.680546760559082, -3.1200637817382812, -1.559580683708191, 0.0009024143218994141, 1.5613856315612793, 3.12186861038208, 4.682351589202881, 6.24283504486084, 7.803318023681641, 9.363801002502441, 10.924283981323242, 12.484766960144043, 14.045249938964844, 15.605733871459961, 17.166215896606445, 18.726699829101562, 20.287181854248047, 21.847665786743164, 23.40814971923828, 24.968631744384766, 26.529115676879883, 28.089597702026367, 29.650081634521484, 31.21056365966797, 32.77104949951172, 34.3315315246582, 35.89201354980469, 37.45249938964844, 39.01298141479492, 40.573463439941406, 42.13394546508789, 43.69443130493164, 45.254913330078125, 46.81539535522461]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 5.0, 7.0, 7.0, 11.0, 13.0, 14.0, 16.0, 9.0, 16.0, 17.0, 18.0, 32.0, 24.0, 23.0, 27.0, 27.0, 43.0, 36.0, 40.0, 33.0, 38.0, 41.0, 30.0, 31.0, 34.0, 41.0, 34.0, 26.0, 36.0, 25.0, 25.0, 32.0, 21.0, 16.0, 24.0, 10.0, 18.0, 22.0, 8.0, 9.0, 9.0, 12.0, 9.0, 6.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.10546875, -4.94158935546875, -4.7777099609375, -4.61383056640625, -4.449951171875, -4.28607177734375, -4.1221923828125, -3.95831298828125, -3.79443359375, -3.63055419921875, -3.4666748046875, -3.30279541015625, -3.138916015625, -2.97503662109375, -2.8111572265625, -2.64727783203125, -2.4833984375, -2.31951904296875, -2.1556396484375, -1.99176025390625, -1.827880859375, -1.66400146484375, -1.5001220703125, -1.33624267578125, -1.17236328125, -1.00848388671875, -0.8446044921875, -0.68072509765625, -0.516845703125, -0.35296630859375, -0.1890869140625, -0.02520751953125, 0.138671875, 0.30255126953125, 0.4664306640625, 0.63031005859375, 0.794189453125, 0.95806884765625, 1.1219482421875, 1.28582763671875, 1.44970703125, 1.61358642578125, 1.7774658203125, 1.94134521484375, 2.105224609375, 2.26910400390625, 2.4329833984375, 2.59686279296875, 2.7607421875, 2.92462158203125, 3.0885009765625, 3.25238037109375, 3.416259765625, 3.58013916015625, 3.7440185546875, 3.90789794921875, 4.07177734375, 4.23565673828125, 4.3995361328125, 4.56341552734375, 4.727294921875, 4.89117431640625, 5.0550537109375, 5.21893310546875, 5.3828125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 12.0, 13.0, 11.0, 12.0, 14.0, 25.0, 25.0, 31.0, 24.0, 38.0, 51.0, 66.0, 84.0, 147.0, 234.0, 738.0, 4486.0, 47685.0, 1295290.0, 2696876.0, 136426.0, 9594.0, 1432.0, 342.0, 145.0, 99.0, 84.0, 42.0, 37.0, 40.0, 32.0, 24.0, 20.0, 21.0, 16.0, 12.0, 7.0, 14.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-17.578125, -17.03173828125, -16.4853515625, -15.93896484375, -15.392578125, -14.84619140625, -14.2998046875, -13.75341796875, -13.20703125, -12.66064453125, -12.1142578125, -11.56787109375, -11.021484375, -10.47509765625, -9.9287109375, -9.38232421875, -8.8359375, -8.28955078125, -7.7431640625, -7.19677734375, -6.650390625, -6.10400390625, -5.5576171875, -5.01123046875, -4.46484375, -3.91845703125, -3.3720703125, -2.82568359375, -2.279296875, -1.73291015625, -1.1865234375, -0.64013671875, -0.09375, 0.45263671875, 0.9990234375, 1.54541015625, 2.091796875, 2.63818359375, 3.1845703125, 3.73095703125, 4.27734375, 4.82373046875, 5.3701171875, 5.91650390625, 6.462890625, 7.00927734375, 7.5556640625, 8.10205078125, 8.6484375, 9.19482421875, 9.7412109375, 10.28759765625, 10.833984375, 11.38037109375, 11.9267578125, 12.47314453125, 13.01953125, 13.56591796875, 14.1123046875, 14.65869140625, 15.205078125, 15.75146484375, 16.2978515625, 16.84423828125, 17.390625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 7.0, 13.0, 15.0, 23.0, 36.0, 47.0, 67.0, 99.0, 134.0, 189.0, 237.0, 304.0, 406.0, 473.0, 523.0, 392.0, 300.0, 208.0, 140.0, 113.0, 87.0, 68.0, 37.0, 43.0, 28.0, 24.0, 16.0, 11.0, 8.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.796875, -10.46728515625, -10.1376953125, -9.80810546875, -9.478515625, -9.14892578125, -8.8193359375, -8.48974609375, -8.16015625, -7.83056640625, -7.5009765625, -7.17138671875, -6.841796875, -6.51220703125, -6.1826171875, -5.85302734375, -5.5234375, -5.19384765625, -4.8642578125, -4.53466796875, -4.205078125, -3.87548828125, -3.5458984375, -3.21630859375, -2.88671875, -2.55712890625, -2.2275390625, -1.89794921875, -1.568359375, -1.23876953125, -0.9091796875, -0.57958984375, -0.25, 0.07958984375, 0.4091796875, 0.73876953125, 1.068359375, 1.39794921875, 1.7275390625, 2.05712890625, 2.38671875, 2.71630859375, 3.0458984375, 3.37548828125, 3.705078125, 4.03466796875, 4.3642578125, 4.69384765625, 5.0234375, 5.35302734375, 5.6826171875, 6.01220703125, 6.341796875, 6.67138671875, 7.0009765625, 7.33056640625, 7.66015625, 7.98974609375, 8.3193359375, 8.64892578125, 8.978515625, 9.30810546875, 9.6376953125, 9.96728515625, 10.296875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 4.0, 12.0, 14.0, 13.0, 28.0, 24.0, 34.0, 49.0, 63.0, 71.0, 97.0, 113.0, 172.0, 210.0, 278.0, 437.0, 1140.0, 17167.0, 3690034.0, 477878.0, 4369.0, 712.0, 357.0, 243.0, 169.0, 130.0, 110.0, 76.0, 69.0, 37.0, 40.0, 32.0, 29.0, 18.0, 15.0, 9.0, 8.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.96875, -45.537109375, -44.10546875, -42.673828125, -41.2421875, -39.810546875, -38.37890625, -36.947265625, -35.515625, -34.083984375, -32.65234375, -31.220703125, -29.7890625, -28.357421875, -26.92578125, -25.494140625, -24.0625, -22.630859375, -21.19921875, -19.767578125, -18.3359375, -16.904296875, -15.47265625, -14.041015625, -12.609375, -11.177734375, -9.74609375, -8.314453125, -6.8828125, -5.451171875, -4.01953125, -2.587890625, -1.15625, 0.275390625, 1.70703125, 3.138671875, 4.5703125, 6.001953125, 7.43359375, 8.865234375, 10.296875, 11.728515625, 13.16015625, 14.591796875, 16.0234375, 17.455078125, 18.88671875, 20.318359375, 21.75, 23.181640625, 24.61328125, 26.044921875, 27.4765625, 28.908203125, 30.33984375, 31.771484375, 33.203125, 34.634765625, 36.06640625, 37.498046875, 38.9296875, 40.361328125, 41.79296875, 43.224609375, 44.65625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 25.0, 143.0, 448.0, 324.0, 67.0, 10.0, 0.0, 2.0], "bins": [-276.5811767578125, -271.86993408203125, -267.1587219238281, -262.447509765625, -257.73626708984375, -253.02503967285156, -248.31381225585938, -243.6025848388672, -238.891357421875, -234.1801300048828, -229.46890258789062, -224.75767517089844, -220.04644775390625, -215.33522033691406, -210.62399291992188, -205.9127655029297, -201.2015380859375, -196.4903106689453, -191.77908325195312, -187.06785583496094, -182.35662841796875, -177.64540100097656, -172.93417358398438, -168.2229461669922, -163.51171875, -158.8004913330078, -154.08926391601562, -149.37803649902344, -144.66680908203125, -139.95558166503906, -135.24435424804688, -130.5331268310547, -125.82190704345703, -121.11067962646484, -116.39945220947266, -111.68822479248047, -106.97699737548828, -102.2657699584961, -97.5545425415039, -92.84331512451172, -88.13208770751953, -83.42086029052734, -78.70963287353516, -73.99840545654297, -69.28717803955078, -64.5759506225586, -59.864723205566406, -55.15349578857422, -50.44226837158203, -45.731040954589844, -41.019813537597656, -36.30858612060547, -31.59735870361328, -26.886131286621094, -22.174903869628906, -17.46367645263672, -12.752447128295898, -8.041219711303711, -3.3299922943115234, 1.381235122680664, 6.092462539672852, 10.803689956665039, 15.514917373657227, 20.226144790649414, 24.9373722076416]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 5.0, 7.0, 5.0, 6.0, 9.0, 9.0, 9.0, 16.0, 16.0, 23.0, 25.0, 30.0, 27.0, 34.0, 37.0, 41.0, 34.0, 40.0, 47.0, 39.0, 35.0, 51.0, 45.0, 41.0, 49.0, 24.0, 35.0, 31.0, 37.0, 31.0, 27.0, 25.0, 22.0, 23.0, 15.0, 12.0, 13.0, 5.0, 7.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.204925537109375, -32.067684173583984, -30.930438995361328, -29.793197631835938, -28.655954360961914, -27.51871109008789, -26.3814697265625, -25.244226455688477, -24.106983184814453, -22.96973991394043, -21.832496643066406, -20.695255279541016, -19.558012008666992, -18.42076873779297, -17.283527374267578, -16.146284103393555, -15.009040832519531, -13.871797561645508, -12.7345552444458, -11.597312927246094, -10.46006965637207, -9.322826385498047, -8.18558406829834, -7.048341274261475, -5.911098480224609, -4.773855686187744, -3.636612892150879, -2.4993700981140137, -1.3621273040771484, -0.2248845100402832, 0.912358283996582, 2.0496010780334473, 3.1868438720703125, 4.324086666107178, 5.461329460144043, 6.598572254180908, 7.735815048217773, 8.873058319091797, 10.010300636291504, 11.147542953491211, 12.284786224365234, 13.422029495239258, 14.559271812438965, 15.696514129638672, 16.833757400512695, 17.97100067138672, 19.10824203491211, 20.245485305786133, 21.382728576660156, 22.51997184753418, 23.657215118408203, 24.794456481933594, 25.931699752807617, 27.06894302368164, 28.20618438720703, 29.343427658081055, 30.480670928955078, 31.6179141998291, 32.755157470703125, 33.892398834228516, 35.029640197753906, 36.16688537597656, 37.30412673950195, 38.44137191772461, 39.57861328125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 5.0, 9.0, 12.0, 14.0, 8.0, 12.0, 23.0, 20.0, 14.0, 21.0, 25.0, 39.0, 26.0, 47.0, 32.0, 36.0, 30.0, 30.0, 42.0, 34.0, 37.0, 42.0, 36.0, 47.0, 30.0, 32.0, 38.0, 28.0, 33.0, 23.0, 21.0, 23.0, 13.0, 16.0, 19.0, 15.0, 11.0, 11.0, 5.0, 11.0, 6.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.6796875, -5.50750732421875, -5.3353271484375, -5.16314697265625, -4.990966796875, -4.81878662109375, -4.6466064453125, -4.47442626953125, -4.30224609375, -4.13006591796875, -3.9578857421875, -3.78570556640625, -3.613525390625, -3.44134521484375, -3.2691650390625, -3.09698486328125, -2.9248046875, -2.75262451171875, -2.5804443359375, -2.40826416015625, -2.236083984375, -2.06390380859375, -1.8917236328125, -1.71954345703125, -1.54736328125, -1.37518310546875, -1.2030029296875, -1.03082275390625, -0.858642578125, -0.68646240234375, -0.5142822265625, -0.34210205078125, -0.169921875, 0.00225830078125, 0.1744384765625, 0.34661865234375, 0.518798828125, 0.69097900390625, 0.8631591796875, 1.03533935546875, 1.20751953125, 1.37969970703125, 1.5518798828125, 1.72406005859375, 1.896240234375, 2.06842041015625, 2.2406005859375, 2.41278076171875, 2.5849609375, 2.75714111328125, 2.9293212890625, 3.10150146484375, 3.273681640625, 3.44586181640625, 3.6180419921875, 3.79022216796875, 3.96240234375, 4.13458251953125, 4.3067626953125, 4.47894287109375, 4.651123046875, 4.82330322265625, 4.9954833984375, 5.16766357421875, 5.33984375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 13.0, 17.0, 39.0, 41.0, 49.0, 89.0, 97.0, 194.0, 285.0, 390.0, 578.0, 879.0, 1193.0, 1874.0, 2462.0, 3613.0, 5122.0, 7358.0, 10337.0, 15077.0, 21832.0, 33213.0, 50357.0, 78240.0, 125765.0, 181695.0, 173662.0, 115995.0, 73240.0, 46882.0, 30613.0, 20553.0, 14029.0, 9908.0, 6824.0, 4770.0, 3564.0, 2363.0, 1698.0, 1162.0, 813.0, 523.0, 366.0, 253.0, 178.0, 111.0, 67.0, 57.0, 40.0, 29.0, 21.0, 7.0, 9.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.65478515625, -0.6342697143554688, -0.6137542724609375, -0.5932388305664062, -0.572723388671875, -0.5522079467773438, -0.5316925048828125, -0.5111770629882812, -0.49066162109375, -0.47014617919921875, -0.4496307373046875, -0.42911529541015625, -0.408599853515625, -0.38808441162109375, -0.3675689697265625, -0.34705352783203125, -0.3265380859375, -0.30602264404296875, -0.2855072021484375, -0.26499176025390625, -0.244476318359375, -0.22396087646484375, -0.2034454345703125, -0.18292999267578125, -0.16241455078125, -0.14189910888671875, -0.1213836669921875, -0.10086822509765625, -0.080352783203125, -0.05983734130859375, -0.0393218994140625, -0.01880645751953125, 0.001708984375, 0.02222442626953125, 0.0427398681640625, 0.06325531005859375, 0.083770751953125, 0.10428619384765625, 0.1248016357421875, 0.14531707763671875, 0.16583251953125, 0.18634796142578125, 0.2068634033203125, 0.22737884521484375, 0.247894287109375, 0.26840972900390625, 0.2889251708984375, 0.30944061279296875, 0.3299560546875, 0.35047149658203125, 0.3709869384765625, 0.39150238037109375, 0.412017822265625, 0.43253326416015625, 0.4530487060546875, 0.47356414794921875, 0.49407958984375, 0.5145950317382812, 0.5351104736328125, 0.5556259155273438, 0.576141357421875, 0.5966567993164062, 0.6171722412109375, 0.6376876831054688, 0.658203125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 11.0, 5.0, 13.0, 12.0, 12.0, 11.0, 23.0, 15.0, 22.0, 27.0, 19.0, 29.0, 43.0, 46.0, 40.0, 36.0, 35.0, 46.0, 41.0, 1061.0, 42.0, 40.0, 33.0, 44.0, 37.0, 38.0, 33.0, 36.0, 23.0, 20.0, 26.0, 18.0, 12.0, 15.0, 12.0, 9.0, 10.0, 5.0, 8.0, 6.0, 2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.09375, -3.970977783203125, -3.84820556640625, -3.725433349609375, -3.6026611328125, -3.479888916015625, -3.35711669921875, -3.234344482421875, -3.111572265625, -2.988800048828125, -2.86602783203125, -2.743255615234375, -2.6204833984375, -2.497711181640625, -2.37493896484375, -2.252166748046875, -2.12939453125, -2.006622314453125, -1.88385009765625, -1.761077880859375, -1.6383056640625, -1.515533447265625, -1.39276123046875, -1.269989013671875, -1.147216796875, -1.024444580078125, -0.90167236328125, -0.778900146484375, -0.6561279296875, -0.533355712890625, -0.41058349609375, -0.287811279296875, -0.1650390625, -0.042266845703125, 0.08050537109375, 0.203277587890625, 0.3260498046875, 0.448822021484375, 0.57159423828125, 0.694366455078125, 0.817138671875, 0.939910888671875, 1.06268310546875, 1.185455322265625, 1.3082275390625, 1.430999755859375, 1.55377197265625, 1.676544189453125, 1.79931640625, 1.922088623046875, 2.04486083984375, 2.167633056640625, 2.2904052734375, 2.413177490234375, 2.53594970703125, 2.658721923828125, 2.781494140625, 2.904266357421875, 3.02703857421875, 3.149810791015625, 3.2725830078125, 3.395355224609375, 3.51812744140625, 3.640899658203125, 3.763671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 12.0, 3.0, 13.0, 14.0, 25.0, 35.0, 50.0, 90.0, 139.0, 243.0, 393.0, 673.0, 1019.0, 1683.0, 2877.0, 4872.0, 8283.0, 14103.0, 24256.0, 43485.0, 78151.0, 146047.0, 1281594.0, 212865.0, 122995.0, 65772.0, 36871.0, 20979.0, 12051.0, 7149.0, 4118.0, 2398.0, 1483.0, 871.0, 563.0, 337.0, 229.0, 131.0, 81.0, 51.0, 54.0, 24.0, 16.0, 8.0, 8.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7685546875, -0.7458572387695312, -0.7231597900390625, -0.7004623413085938, -0.677764892578125, -0.6550674438476562, -0.6323699951171875, -0.6096725463867188, -0.58697509765625, -0.5642776489257812, -0.5415802001953125, -0.5188827514648438, -0.496185302734375, -0.47348785400390625, -0.4507904052734375, -0.42809295654296875, -0.4053955078125, -0.38269805908203125, -0.3600006103515625, -0.33730316162109375, -0.314605712890625, -0.29190826416015625, -0.2692108154296875, -0.24651336669921875, -0.22381591796875, -0.20111846923828125, -0.1784210205078125, -0.15572357177734375, -0.133026123046875, -0.11032867431640625, -0.0876312255859375, -0.06493377685546875, -0.042236328125, -0.01953887939453125, 0.0031585693359375, 0.02585601806640625, 0.048553466796875, 0.07125091552734375, 0.0939483642578125, 0.11664581298828125, 0.13934326171875, 0.16204071044921875, 0.1847381591796875, 0.20743560791015625, 0.230133056640625, 0.25283050537109375, 0.2755279541015625, 0.29822540283203125, 0.3209228515625, 0.34362030029296875, 0.3663177490234375, 0.38901519775390625, 0.411712646484375, 0.43441009521484375, 0.4571075439453125, 0.47980499267578125, 0.50250244140625, 0.5251998901367188, 0.5478973388671875, 0.5705947875976562, 0.593292236328125, 0.6159896850585938, 0.6386871337890625, 0.6613845825195312, 0.68408203125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 0.0, 4.0, 1.0, 4.0, 1.0, 8.0, 4.0, 14.0, 8.0, 14.0, 10.0, 16.0, 23.0, 25.0, 32.0, 37.0, 42.0, 37.0, 48.0, 55.0, 52.0, 59.0, 39.0, 69.0, 59.0, 46.0, 37.0, 31.0, 41.0, 37.0, 34.0, 20.0, 15.0, 12.0, 11.0, 8.0, 9.0, 8.0, 8.0, 7.0, 2.0, 4.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019006729125976562, -0.0018430203199386597, -0.001785367727279663, -0.0017277151346206665, -0.00167006254196167, -0.0016124099493026733, -0.0015547573566436768, -0.0014971047639846802, -0.0014394521713256836, -0.001381799578666687, -0.0013241469860076904, -0.0012664943933486938, -0.0012088418006896973, -0.0011511892080307007, -0.001093536615371704, -0.0010358840227127075, -0.000978231430053711, -0.0009205788373947144, -0.0008629262447357178, -0.0008052736520767212, -0.0007476210594177246, -0.000689968466758728, -0.0006323158740997314, -0.0005746632814407349, -0.0005170106887817383, -0.0004593580961227417, -0.0004017055034637451, -0.00034405291080474854, -0.00028640031814575195, -0.00022874772548675537, -0.0001710951328277588, -0.00011344254016876221, -5.5789947509765625e-05, 1.862645149230957e-06, 5.951523780822754e-05, 0.00011716783046722412, 0.0001748204231262207, 0.00023247301578521729, 0.00029012560844421387, 0.00034777820110321045, 0.00040543079376220703, 0.0004630833864212036, 0.0005207359790802002, 0.0005783885717391968, 0.0006360411643981934, 0.0006936937570571899, 0.0007513463497161865, 0.0008089989423751831, 0.0008666515350341797, 0.0009243041276931763, 0.0009819567203521729, 0.0010396093130111694, 0.001097261905670166, 0.0011549144983291626, 0.0012125670909881592, 0.0012702196836471558, 0.0013278722763061523, 0.001385524868965149, 0.0014431774616241455, 0.001500830054283142, 0.0015584826469421387, 0.0016161352396011353, 0.0016737878322601318, 0.0017314404249191284, 0.001789093017578125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 9.0, 8.0, 8.0, 14.0, 13.0, 18.0, 26.0, 31.0, 33.0, 43.0, 56.0, 69.0, 98.0, 131.0, 213.0, 368.0, 980.0, 49957.0, 990377.0, 4551.0, 605.0, 279.0, 156.0, 135.0, 77.0, 53.0, 43.0, 35.0, 30.0, 40.0, 15.0, 19.0, 12.0, 11.0, 7.0, 6.0, 8.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.04083251953125, -0.03952789306640625, -0.0382232666015625, -0.03691864013671875, -0.035614013671875, -0.03430938720703125, -0.0330047607421875, -0.03170013427734375, -0.0303955078125, -0.02909088134765625, -0.0277862548828125, -0.02648162841796875, -0.025177001953125, -0.02387237548828125, -0.0225677490234375, -0.02126312255859375, -0.01995849609375, -0.01865386962890625, -0.0173492431640625, -0.01604461669921875, -0.014739990234375, -0.01343536376953125, -0.0121307373046875, -0.01082611083984375, -0.009521484375, -0.00821685791015625, -0.0069122314453125, -0.00560760498046875, -0.004302978515625, -0.00299835205078125, -0.0016937255859375, -0.00038909912109375, 0.00091552734375, 0.00222015380859375, 0.0035247802734375, 0.00482940673828125, 0.006134033203125, 0.00743865966796875, 0.0087432861328125, 0.01004791259765625, 0.0113525390625, 0.01265716552734375, 0.0139617919921875, 0.01526641845703125, 0.016571044921875, 0.01787567138671875, 0.0191802978515625, 0.02048492431640625, 0.02178955078125, 0.02309417724609375, 0.0243988037109375, 0.02570343017578125, 0.027008056640625, 0.02831268310546875, 0.0296173095703125, 0.03092193603515625, 0.0322265625, 0.03353118896484375, 0.0348358154296875, 0.03614044189453125, 0.037445068359375, 0.03874969482421875, 0.0400543212890625, 0.04135894775390625, 0.04266357421875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 24.0, 943.0, 48.0, 1.0, 0.0, 1.0], "bins": [-0.036522723734378815, -0.035909418016672134, -0.035296108573675156, -0.034682802855968475, -0.0340694934129715, -0.033456187695264816, -0.032842881977558136, -0.03222957253456116, -0.03161626681685448, -0.031002959236502647, -0.030389651656150818, -0.029776345938444138, -0.029163038358092308, -0.02854973077774048, -0.027936425060033798, -0.02732311747968197, -0.02670980989933014, -0.02609650231897831, -0.02548319473862648, -0.0248698890209198, -0.02425658144056797, -0.02364327386021614, -0.02302996814250946, -0.02241666056215763, -0.0218033529818058, -0.021190045401453972, -0.020576737821102142, -0.019963432103395462, -0.019350124523043633, -0.018736816942691803, -0.018123511224985123, -0.017510203644633293, -0.016896894201636314, -0.016283586621284485, -0.015670280903577805, -0.015056973323225975, -0.014443665742874146, -0.013830358162522316, -0.013217051513493061, -0.012603744864463806, -0.011990437284111977, -0.011377129703760147, -0.010763823054730892, -0.010150516405701637, -0.009537208825349808, -0.008923901244997978, -0.008310594595968723, -0.007697287481278181, -0.007083980366587639, -0.006470673251897097, -0.005857366137206554, -0.005244059022516012, -0.00463075190782547, -0.004017444793134928, -0.0034041376784443855, -0.0027908305637538433, -0.002177523449063301, -0.0015642163343727589, -0.0009509092196822166, -0.0003376021049916744, 0.0002757050096988678, 0.00088901212438941, 0.0015023192390799522, 0.0021156263537704945, 0.0027289334684610367]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 12.0, 15.0, 26.0, 29.0, 32.0, 43.0, 53.0, 65.0, 54.0, 64.0, 70.0, 62.0, 70.0, 69.0, 54.0, 49.0, 55.0, 37.0, 25.0, 25.0, 30.0, 24.0, 8.0, 7.0, 11.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011633038520812988, -0.0011096522212028503, -0.0010560005903244019, -0.0010023489594459534, -0.0009486973285675049, -0.0008950456976890564, -0.0008413940668106079, -0.0007877424359321594, -0.0007340908050537109, -0.0006804391741752625, -0.000626787543296814, -0.0005731359124183655, -0.000519484281539917, -0.0004658326506614685, -0.00041218101978302, -0.00035852938890457153, -0.00030487775802612305, -0.00025122612714767456, -0.00019757449626922607, -0.0001439228653907776, -9.02712345123291e-05, -3.6619603633880615e-05, 1.703202724456787e-05, 7.068365812301636e-05, 0.00012433528900146484, 0.00017798691987991333, 0.00023163855075836182, 0.0002852901816368103, 0.0003389418125152588, 0.0003925934433937073, 0.00044624507427215576, 0.0004998967051506042, 0.0005535483360290527, 0.0006071999669075012, 0.0006608515977859497, 0.0007145032286643982, 0.0007681548595428467, 0.0008218064904212952, 0.0008754581212997437, 0.0009291097521781921, 0.0009827613830566406, 0.0010364130139350891, 0.0010900646448135376, 0.001143716275691986, 0.0011973679065704346, 0.001251019537448883, 0.0013046711683273315, 0.00135832279920578, 0.0014119744300842285, 0.001465626060962677, 0.0015192776918411255, 0.001572929322719574, 0.0016265809535980225, 0.001680232584476471, 0.0017338842153549194, 0.001787535846233368, 0.0018411874771118164, 0.001894839107990265, 0.0019484907388687134, 0.002002142369747162, 0.0020557940006256104, 0.002109445631504059, 0.0021630972623825073, 0.002216748893260956, 0.0022704005241394043]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 5.0, 9.0, 12.0, 14.0, 8.0, 12.0, 23.0, 20.0, 14.0, 21.0, 25.0, 39.0, 26.0, 47.0, 32.0, 36.0, 30.0, 30.0, 42.0, 34.0, 37.0, 42.0, 36.0, 47.0, 30.0, 32.0, 38.0, 28.0, 33.0, 24.0, 20.0, 23.0, 13.0, 16.0, 19.0, 15.0, 11.0, 11.0, 5.0, 11.0, 6.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.6796875, -5.50750732421875, -5.3353271484375, -5.16314697265625, -4.990966796875, -4.81878662109375, -4.6466064453125, -4.47442626953125, -4.30224609375, -4.13006591796875, -3.9578857421875, -3.78570556640625, -3.613525390625, -3.44134521484375, -3.2691650390625, -3.09698486328125, -2.9248046875, -2.75262451171875, -2.5804443359375, -2.40826416015625, -2.236083984375, -2.06390380859375, -1.8917236328125, -1.71954345703125, -1.54736328125, -1.37518310546875, -1.2030029296875, -1.03082275390625, -0.858642578125, -0.68646240234375, -0.5142822265625, -0.34210205078125, -0.169921875, 0.00225830078125, 0.1744384765625, 0.34661865234375, 0.518798828125, 0.69097900390625, 0.8631591796875, 1.03533935546875, 1.20751953125, 1.37969970703125, 1.5518798828125, 1.72406005859375, 1.896240234375, 2.06842041015625, 2.2406005859375, 2.41278076171875, 2.5849609375, 2.75714111328125, 2.9293212890625, 3.10150146484375, 3.273681640625, 3.44586181640625, 3.6180419921875, 3.79022216796875, 3.96240234375, 4.13458251953125, 4.3067626953125, 4.47894287109375, 4.651123046875, 4.82330322265625, 4.9954833984375, 5.16766357421875, 5.33984375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 8.0, 4.0, 4.0, 10.0, 16.0, 17.0, 18.0, 18.0, 21.0, 40.0, 39.0, 54.0, 81.0, 115.0, 140.0, 201.0, 311.0, 513.0, 1314.0, 5655.0, 30810.0, 254706.0, 667732.0, 70710.0, 11662.0, 2338.0, 727.0, 382.0, 239.0, 157.0, 131.0, 89.0, 53.0, 46.0, 43.0, 28.0, 26.0, 23.0, 18.0, 12.0, 9.0, 8.0, 7.0, 4.0, 3.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.2890625, -10.94921875, -10.609375, -10.26953125, -9.9296875, -9.58984375, -9.25, -8.91015625, -8.5703125, -8.23046875, -7.890625, -7.55078125, -7.2109375, -6.87109375, -6.53125, -6.19140625, -5.8515625, -5.51171875, -5.171875, -4.83203125, -4.4921875, -4.15234375, -3.8125, -3.47265625, -3.1328125, -2.79296875, -2.453125, -2.11328125, -1.7734375, -1.43359375, -1.09375, -0.75390625, -0.4140625, -0.07421875, 0.265625, 0.60546875, 0.9453125, 1.28515625, 1.625, 1.96484375, 2.3046875, 2.64453125, 2.984375, 3.32421875, 3.6640625, 4.00390625, 4.34375, 4.68359375, 5.0234375, 5.36328125, 5.703125, 6.04296875, 6.3828125, 6.72265625, 7.0625, 7.40234375, 7.7421875, 8.08203125, 8.421875, 8.76171875, 9.1015625, 9.44140625, 9.78125, 10.12109375, 10.4609375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 6.0, 8.0, 7.0, 8.0, 7.0, 8.0, 14.0, 11.0, 16.0, 19.0, 23.0, 20.0, 14.0, 43.0, 28.0, 47.0, 43.0, 43.0, 56.0, 53.0, 198.0, 1722.0, 206.0, 62.0, 48.0, 49.0, 29.0, 41.0, 24.0, 33.0, 29.0, 22.0, 19.0, 23.0, 16.0, 20.0, 10.0, 6.0, 4.0, 4.0, 9.0, 2.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.890625, -19.278564453125, -18.66650390625, -18.054443359375, -17.4423828125, -16.830322265625, -16.21826171875, -15.606201171875, -14.994140625, -14.382080078125, -13.77001953125, -13.157958984375, -12.5458984375, -11.933837890625, -11.32177734375, -10.709716796875, -10.09765625, -9.485595703125, -8.87353515625, -8.261474609375, -7.6494140625, -7.037353515625, -6.42529296875, -5.813232421875, -5.201171875, -4.589111328125, -3.97705078125, -3.364990234375, -2.7529296875, -2.140869140625, -1.52880859375, -0.916748046875, -0.3046875, 0.307373046875, 0.91943359375, 1.531494140625, 2.1435546875, 2.755615234375, 3.36767578125, 3.979736328125, 4.591796875, 5.203857421875, 5.81591796875, 6.427978515625, 7.0400390625, 7.652099609375, 8.26416015625, 8.876220703125, 9.48828125, 10.100341796875, 10.71240234375, 11.324462890625, 11.9365234375, 12.548583984375, 13.16064453125, 13.772705078125, 14.384765625, 14.996826171875, 15.60888671875, 16.220947265625, 16.8330078125, 17.445068359375, 18.05712890625, 18.669189453125, 19.28125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 5.0, 5.0, 5.0, 11.0, 17.0, 22.0, 25.0, 29.0, 25.0, 43.0, 52.0, 50.0, 60.0, 121.0, 205.0, 406.0, 1088.0, 28455.0, 3104010.0, 9225.0, 816.0, 351.0, 176.0, 113.0, 91.0, 55.0, 42.0, 33.0, 29.0, 33.0, 18.0, 16.0, 14.0, 11.0, 8.0, 10.0, 5.0, 6.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.5, -43.08251953125, -41.6650390625, -40.24755859375, -38.830078125, -37.41259765625, -35.9951171875, -34.57763671875, -33.16015625, -31.74267578125, -30.3251953125, -28.90771484375, -27.490234375, -26.07275390625, -24.6552734375, -23.23779296875, -21.8203125, -20.40283203125, -18.9853515625, -17.56787109375, -16.150390625, -14.73291015625, -13.3154296875, -11.89794921875, -10.48046875, -9.06298828125, -7.6455078125, -6.22802734375, -4.810546875, -3.39306640625, -1.9755859375, -0.55810546875, 0.859375, 2.27685546875, 3.6943359375, 5.11181640625, 6.529296875, 7.94677734375, 9.3642578125, 10.78173828125, 12.19921875, 13.61669921875, 15.0341796875, 16.45166015625, 17.869140625, 19.28662109375, 20.7041015625, 22.12158203125, 23.5390625, 24.95654296875, 26.3740234375, 27.79150390625, 29.208984375, 30.62646484375, 32.0439453125, 33.46142578125, 34.87890625, 36.29638671875, 37.7138671875, 39.13134765625, 40.548828125, 41.96630859375, 43.3837890625, 44.80126953125, 46.21875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 164.0, 781.0, 69.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.91584014892578, -17.040651321411133, -13.1654634475708, -9.290275573730469, -5.41508674621582, -1.5398979187011719, 2.3352890014648438, 6.210477828979492, 10.08566665649414, 13.960855484008789, 17.836044311523438, 21.711231231689453, 25.5864200592041, 29.46160888671875, 33.336795806884766, 37.21198272705078, 41.08717346191406, 44.96236038208008, 48.83755111694336, 52.712738037109375, 56.587928771972656, 60.46311569213867, 64.33830261230469, 68.21349334716797, 72.08868408203125, 75.96387481689453, 79.83905792236328, 83.71424865722656, 87.58943939208984, 91.46463012695312, 95.33981323242188, 99.21500396728516, 103.09017944335938, 106.96537017822266, 110.8405532836914, 114.71574401855469, 118.59093475341797, 122.46612548828125, 126.34130859375, 130.21649169921875, 134.09169006347656, 137.9668731689453, 141.84207153320312, 145.71725463867188, 149.59243774414062, 153.46763610839844, 157.3428192138672, 161.21800231933594, 165.09320068359375, 168.9683837890625, 172.8435821533203, 176.71876525878906, 180.5939483642578, 184.46914672851562, 188.34432983398438, 192.21951293945312, 196.09469604492188, 199.96987915039062, 203.84507751464844, 207.7202606201172, 211.59544372558594, 215.47064208984375, 219.3458251953125, 223.22100830078125, 227.09620666503906]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 6.0, 7.0, 9.0, 13.0, 9.0, 12.0, 11.0, 12.0, 18.0, 22.0, 33.0, 40.0, 35.0, 45.0, 37.0, 38.0, 48.0, 46.0, 38.0, 50.0, 39.0, 48.0, 32.0, 34.0, 37.0, 32.0, 38.0, 36.0, 32.0, 24.0, 21.0, 16.0, 13.0, 17.0, 14.0, 7.0, 5.0, 4.0, 4.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-55.597747802734375, -54.0280876159668, -52.45842742919922, -50.88876724243164, -49.31910705566406, -47.749446868896484, -46.179786682128906, -44.61012649536133, -43.04046630859375, -41.47080612182617, -39.901145935058594, -38.331485748291016, -36.76182556152344, -35.19216537475586, -33.62250518798828, -32.0528450012207, -30.483186721801758, -28.91352653503418, -27.3438663482666, -25.774206161499023, -24.204545974731445, -22.634885787963867, -21.065227508544922, -19.495567321777344, -17.925907135009766, -16.356246948242188, -14.78658676147461, -13.216926574707031, -11.647266387939453, -10.077606201171875, -8.507946968078613, -6.938286781311035, -5.368625640869141, -3.7989654541015625, -2.2293055057525635, -0.6596455574035645, 0.9100146293640137, 2.479674816131592, 4.049334526062012, 5.61899471282959, 7.188654899597168, 8.758315086364746, 10.327975273132324, 11.897634506225586, 13.467294692993164, 15.036954879760742, 16.60661506652832, 18.1762752532959, 19.745935440063477, 21.315595626831055, 22.885255813598633, 24.45491600036621, 26.02457618713379, 27.594236373901367, 29.163894653320312, 30.73355484008789, 32.30321502685547, 33.87287521362305, 35.442535400390625, 37.0121955871582, 38.58185577392578, 40.15151596069336, 41.72117614746094, 43.290836334228516, 44.860496520996094]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 8.0, 14.0, 6.0, 9.0, 9.0, 14.0, 15.0, 18.0, 18.0, 18.0, 24.0, 34.0, 34.0, 29.0, 37.0, 36.0, 40.0, 41.0, 31.0, 42.0, 27.0, 39.0, 42.0, 44.0, 37.0, 29.0, 31.0, 31.0, 33.0, 36.0, 31.0, 19.0, 17.0, 9.0, 20.0, 16.0, 6.0, 10.0, 8.0, 10.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.62109375, -5.44287109375, -5.2646484375, -5.08642578125, -4.908203125, -4.72998046875, -4.5517578125, -4.37353515625, -4.1953125, -4.01708984375, -3.8388671875, -3.66064453125, -3.482421875, -3.30419921875, -3.1259765625, -2.94775390625, -2.76953125, -2.59130859375, -2.4130859375, -2.23486328125, -2.056640625, -1.87841796875, -1.7001953125, -1.52197265625, -1.34375, -1.16552734375, -0.9873046875, -0.80908203125, -0.630859375, -0.45263671875, -0.2744140625, -0.09619140625, 0.08203125, 0.26025390625, 0.4384765625, 0.61669921875, 0.794921875, 0.97314453125, 1.1513671875, 1.32958984375, 1.5078125, 1.68603515625, 1.8642578125, 2.04248046875, 2.220703125, 2.39892578125, 2.5771484375, 2.75537109375, 2.93359375, 3.11181640625, 3.2900390625, 3.46826171875, 3.646484375, 3.82470703125, 4.0029296875, 4.18115234375, 4.359375, 4.53759765625, 4.7158203125, 4.89404296875, 5.072265625, 5.25048828125, 5.4287109375, 5.60693359375, 5.78515625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 11.0, 9.0, 9.0, 7.0, 16.0, 13.0, 18.0, 29.0, 32.0, 42.0, 54.0, 97.0, 170.0, 331.0, 748.0, 2147.0, 8288.0, 54691.0, 830426.0, 2865569.0, 392151.0, 30708.0, 5633.0, 1689.0, 607.0, 278.0, 153.0, 92.0, 47.0, 56.0, 25.0, 24.0, 23.0, 16.0, 12.0, 7.0, 10.0, 9.0, 4.0, 3.0, 2.0, 7.0, 8.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-15.0859375, -14.619873046875, -14.15380859375, -13.687744140625, -13.2216796875, -12.755615234375, -12.28955078125, -11.823486328125, -11.357421875, -10.891357421875, -10.42529296875, -9.959228515625, -9.4931640625, -9.027099609375, -8.56103515625, -8.094970703125, -7.62890625, -7.162841796875, -6.69677734375, -6.230712890625, -5.7646484375, -5.298583984375, -4.83251953125, -4.366455078125, -3.900390625, -3.434326171875, -2.96826171875, -2.502197265625, -2.0361328125, -1.570068359375, -1.10400390625, -0.637939453125, -0.171875, 0.294189453125, 0.76025390625, 1.226318359375, 1.6923828125, 2.158447265625, 2.62451171875, 3.090576171875, 3.556640625, 4.022705078125, 4.48876953125, 4.954833984375, 5.4208984375, 5.886962890625, 6.35302734375, 6.819091796875, 7.28515625, 7.751220703125, 8.21728515625, 8.683349609375, 9.1494140625, 9.615478515625, 10.08154296875, 10.547607421875, 11.013671875, 11.479736328125, 11.94580078125, 12.411865234375, 12.8779296875, 13.343994140625, 13.81005859375, 14.276123046875, 14.7421875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 6.0, 6.0, 11.0, 14.0, 14.0, 30.0, 23.0, 36.0, 44.0, 60.0, 81.0, 119.0, 138.0, 207.0, 263.0, 304.0, 421.0, 434.0, 408.0, 343.0, 292.0, 199.0, 146.0, 101.0, 92.0, 77.0, 51.0, 41.0, 27.0, 15.0, 13.0, 13.0, 11.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.84375, -9.551025390625, -9.25830078125, -8.965576171875, -8.6728515625, -8.380126953125, -8.08740234375, -7.794677734375, -7.501953125, -7.209228515625, -6.91650390625, -6.623779296875, -6.3310546875, -6.038330078125, -5.74560546875, -5.452880859375, -5.16015625, -4.867431640625, -4.57470703125, -4.281982421875, -3.9892578125, -3.696533203125, -3.40380859375, -3.111083984375, -2.818359375, -2.525634765625, -2.23291015625, -1.940185546875, -1.6474609375, -1.354736328125, -1.06201171875, -0.769287109375, -0.4765625, -0.183837890625, 0.10888671875, 0.401611328125, 0.6943359375, 0.987060546875, 1.27978515625, 1.572509765625, 1.865234375, 2.157958984375, 2.45068359375, 2.743408203125, 3.0361328125, 3.328857421875, 3.62158203125, 3.914306640625, 4.20703125, 4.499755859375, 4.79248046875, 5.085205078125, 5.3779296875, 5.670654296875, 5.96337890625, 6.256103515625, 6.548828125, 6.841552734375, 7.13427734375, 7.427001953125, 7.7197265625, 8.012451171875, 8.30517578125, 8.597900390625, 8.890625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 9.0, 3.0, 3.0, 8.0, 11.0, 15.0, 21.0, 26.0, 48.0, 63.0, 88.0, 98.0, 144.0, 206.0, 352.0, 732.0, 4715.0, 432507.0, 3735104.0, 17516.0, 1290.0, 471.0, 261.0, 170.0, 106.0, 89.0, 60.0, 57.0, 31.0, 29.0, 15.0, 13.0, 4.0, 6.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.28125, -41.798828125, -40.31640625, -38.833984375, -37.3515625, -35.869140625, -34.38671875, -32.904296875, -31.421875, -29.939453125, -28.45703125, -26.974609375, -25.4921875, -24.009765625, -22.52734375, -21.044921875, -19.5625, -18.080078125, -16.59765625, -15.115234375, -13.6328125, -12.150390625, -10.66796875, -9.185546875, -7.703125, -6.220703125, -4.73828125, -3.255859375, -1.7734375, -0.291015625, 1.19140625, 2.673828125, 4.15625, 5.638671875, 7.12109375, 8.603515625, 10.0859375, 11.568359375, 13.05078125, 14.533203125, 16.015625, 17.498046875, 18.98046875, 20.462890625, 21.9453125, 23.427734375, 24.91015625, 26.392578125, 27.875, 29.357421875, 30.83984375, 32.322265625, 33.8046875, 35.287109375, 36.76953125, 38.251953125, 39.734375, 41.216796875, 42.69921875, 44.181640625, 45.6640625, 47.146484375, 48.62890625, 50.111328125, 51.59375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 13.0, 39.0, 76.0, 136.0, 173.0, 203.0, 139.0, 110.0, 59.0, 36.0, 12.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.45834350585938, -71.72279357910156, -69.98724365234375, -68.2516860961914, -66.5161361694336, -64.78058624267578, -63.0450325012207, -61.30948257446289, -59.57392883300781, -57.83837890625, -56.10282516479492, -54.36727523803711, -52.63172149658203, -50.89617156982422, -49.16061782836914, -47.42506790161133, -45.68951416015625, -43.95396423339844, -42.21841049194336, -40.48286056518555, -38.74730682373047, -37.011756896972656, -35.27620315551758, -33.540653228759766, -31.805103302001953, -30.069551467895508, -28.333999633789062, -26.598447799682617, -24.862895965576172, -23.12734603881836, -21.39179229736328, -19.65624237060547, -17.92068862915039, -16.185136795043945, -14.4495849609375, -12.714033126831055, -10.97848129272461, -9.24293041229248, -7.507378578186035, -5.77182674407959, -4.0362749099731445, -2.300723075866699, -0.565171480178833, 1.1703801155090332, 2.9059319496154785, 4.641483306884766, 6.377035140991211, 8.112586975097656, 9.848138809204102, 11.583690643310547, 13.319242477416992, 15.054794311523438, 16.790346145629883, 18.525897979736328, 20.26144790649414, 21.99700164794922, 23.73255157470703, 25.468103408813477, 27.203655242919922, 28.939207077026367, 30.674758911132812, 32.410308837890625, 34.1458625793457, 35.881412506103516, 37.616966247558594]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 2.0, 7.0, 12.0, 11.0, 11.0, 15.0, 14.0, 20.0, 20.0, 20.0, 27.0, 36.0, 29.0, 34.0, 35.0, 35.0, 40.0, 44.0, 49.0, 49.0, 43.0, 44.0, 42.0, 44.0, 39.0, 37.0, 34.0, 11.0, 27.0, 27.0, 25.0, 22.0, 14.0, 22.0, 19.0, 11.0, 7.0, 1.0, 5.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.78478240966797, -26.771011352539062, -25.75724220275879, -24.743471145629883, -23.72970199584961, -22.715930938720703, -21.702159881591797, -20.688390731811523, -19.67462158203125, -18.660850524902344, -17.64708137512207, -16.633310317993164, -15.61954116821289, -14.605770111083984, -13.592000007629395, -12.578229904174805, -11.564458847045898, -10.550688743591309, -9.536918640136719, -8.523147583007812, -7.509377956390381, -6.495607852935791, -5.481837272644043, -4.468067169189453, -3.4542970657348633, -2.4405269622802734, -1.4267566204071045, -0.41298627853393555, 0.6007838249206543, 1.6145539283752441, 2.628324508666992, 3.642094612121582, 4.655864715576172, 5.669634819030762, 6.683404922485352, 7.6971755027771, 8.710945129394531, 9.724716186523438, 10.738486289978027, 11.752256393432617, 12.766026496887207, 13.779796600341797, 14.793566703796387, 15.807336807250977, 16.821107864379883, 17.834877014160156, 18.848648071289062, 19.86241912841797, 20.876188278198242, 21.88995933532715, 22.903728485107422, 23.917499542236328, 24.9312686920166, 25.945039749145508, 26.95880889892578, 27.972579956054688, 28.986351013183594, 30.0001220703125, 31.013891220092773, 32.02766036987305, 33.04143142700195, 34.05520248413086, 35.068973541259766, 36.082740783691406, 37.09651184082031]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 7.0, 5.0, 4.0, 9.0, 11.0, 13.0, 11.0, 23.0, 15.0, 20.0, 20.0, 22.0, 21.0, 40.0, 40.0, 40.0, 35.0, 42.0, 39.0, 43.0, 32.0, 32.0, 43.0, 36.0, 32.0, 52.0, 34.0, 35.0, 43.0, 26.0, 29.0, 20.0, 15.0, 19.0, 14.0, 16.0, 11.0, 11.0, 11.0, 10.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.1328125, -5.9410400390625, -5.749267578125, -5.5574951171875, -5.36572265625, -5.1739501953125, -4.982177734375, -4.7904052734375, -4.5986328125, -4.4068603515625, -4.215087890625, -4.0233154296875, -3.83154296875, -3.6397705078125, -3.447998046875, -3.2562255859375, -3.064453125, -2.8726806640625, -2.680908203125, -2.4891357421875, -2.29736328125, -2.1055908203125, -1.913818359375, -1.7220458984375, -1.5302734375, -1.3385009765625, -1.146728515625, -0.9549560546875, -0.76318359375, -0.5714111328125, -0.379638671875, -0.1878662109375, 0.00390625, 0.1956787109375, 0.387451171875, 0.5792236328125, 0.77099609375, 0.9627685546875, 1.154541015625, 1.3463134765625, 1.5380859375, 1.7298583984375, 1.921630859375, 2.1134033203125, 2.30517578125, 2.4969482421875, 2.688720703125, 2.8804931640625, 3.072265625, 3.2640380859375, 3.455810546875, 3.6475830078125, 3.83935546875, 4.0311279296875, 4.222900390625, 4.4146728515625, 4.6064453125, 4.7982177734375, 4.989990234375, 5.1817626953125, 5.37353515625, 5.5653076171875, 5.757080078125, 5.9488525390625, 6.140625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 5.0, 11.0, 6.0, 21.0, 23.0, 34.0, 56.0, 89.0, 99.0, 148.0, 196.0, 316.0, 455.0, 622.0, 946.0, 1322.0, 1878.0, 2712.0, 4100.0, 5902.0, 9062.0, 13616.0, 21094.0, 33239.0, 53658.0, 88902.0, 143349.0, 196758.0, 172948.0, 111615.0, 67700.0, 41399.0, 25999.0, 16603.0, 10907.0, 7288.0, 4797.0, 3336.0, 2238.0, 1559.0, 1046.0, 789.0, 506.0, 356.0, 275.0, 189.0, 113.0, 100.0, 53.0, 43.0, 36.0, 19.0, 14.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.72509765625, -0.7022476196289062, -0.6793975830078125, -0.6565475463867188, -0.633697509765625, -0.6108474731445312, -0.5879974365234375, -0.5651473999023438, -0.54229736328125, -0.5194473266601562, -0.4965972900390625, -0.47374725341796875, -0.450897216796875, -0.42804718017578125, -0.4051971435546875, -0.38234710693359375, -0.3594970703125, -0.33664703369140625, -0.3137969970703125, -0.29094696044921875, -0.268096923828125, -0.24524688720703125, -0.2223968505859375, -0.19954681396484375, -0.17669677734375, -0.15384674072265625, -0.1309967041015625, -0.10814666748046875, -0.085296630859375, -0.06244659423828125, -0.0395965576171875, -0.01674652099609375, 0.006103515625, 0.02895355224609375, 0.0518035888671875, 0.07465362548828125, 0.097503662109375, 0.12035369873046875, 0.1432037353515625, 0.16605377197265625, 0.18890380859375, 0.21175384521484375, 0.2346038818359375, 0.25745391845703125, 0.280303955078125, 0.30315399169921875, 0.3260040283203125, 0.34885406494140625, 0.3717041015625, 0.39455413818359375, 0.4174041748046875, 0.44025421142578125, 0.463104248046875, 0.48595428466796875, 0.5088043212890625, 0.5316543579101562, 0.55450439453125, 0.5773544311523438, 0.6002044677734375, 0.6230545043945312, 0.645904541015625, 0.6687545776367188, 0.6916046142578125, 0.7144546508789062, 0.7373046875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 9.0, 5.0, 8.0, 11.0, 9.0, 13.0, 12.0, 15.0, 16.0, 19.0, 22.0, 29.0, 41.0, 40.0, 37.0, 44.0, 40.0, 50.0, 35.0, 45.0, 1075.0, 36.0, 41.0, 37.0, 31.0, 44.0, 29.0, 31.0, 32.0, 28.0, 18.0, 23.0, 20.0, 14.0, 5.0, 8.0, 8.0, 12.0, 10.0, 4.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44140625, -3.3153076171875, -3.189208984375, -3.0631103515625, -2.93701171875, -2.8109130859375, -2.684814453125, -2.5587158203125, -2.4326171875, -2.3065185546875, -2.180419921875, -2.0543212890625, -1.92822265625, -1.8021240234375, -1.676025390625, -1.5499267578125, -1.423828125, -1.2977294921875, -1.171630859375, -1.0455322265625, -0.91943359375, -0.7933349609375, -0.667236328125, -0.5411376953125, -0.4150390625, -0.2889404296875, -0.162841796875, -0.0367431640625, 0.08935546875, 0.2154541015625, 0.341552734375, 0.4676513671875, 0.59375, 0.7198486328125, 0.845947265625, 0.9720458984375, 1.09814453125, 1.2242431640625, 1.350341796875, 1.4764404296875, 1.6025390625, 1.7286376953125, 1.854736328125, 1.9808349609375, 2.10693359375, 2.2330322265625, 2.359130859375, 2.4852294921875, 2.611328125, 2.7374267578125, 2.863525390625, 2.9896240234375, 3.11572265625, 3.2418212890625, 3.367919921875, 3.4940185546875, 3.6201171875, 3.7462158203125, 3.872314453125, 3.9984130859375, 4.12451171875, 4.2506103515625, 4.376708984375, 4.5028076171875, 4.62890625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 9.0, 9.0, 12.0, 25.0, 24.0, 31.0, 54.0, 85.0, 139.0, 200.0, 297.0, 485.0, 823.0, 1252.0, 1875.0, 2963.0, 4738.0, 7548.0, 12423.0, 20174.0, 33448.0, 56621.0, 98612.0, 169206.0, 1268386.0, 171093.0, 100774.0, 57353.0, 34441.0, 20428.0, 12262.0, 7731.0, 4920.0, 3098.0, 2037.0, 1283.0, 772.0, 548.0, 325.0, 207.0, 135.0, 114.0, 64.0, 39.0, 21.0, 16.0, 11.0, 10.0, 5.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.7119140625, -0.690673828125, -0.66943359375, -0.648193359375, -0.626953125, -0.605712890625, -0.58447265625, -0.563232421875, -0.5419921875, -0.520751953125, -0.49951171875, -0.478271484375, -0.45703125, -0.435791015625, -0.41455078125, -0.393310546875, -0.3720703125, -0.350830078125, -0.32958984375, -0.308349609375, -0.287109375, -0.265869140625, -0.24462890625, -0.223388671875, -0.2021484375, -0.180908203125, -0.15966796875, -0.138427734375, -0.1171875, -0.095947265625, -0.07470703125, -0.053466796875, -0.0322265625, -0.010986328125, 0.01025390625, 0.031494140625, 0.052734375, 0.073974609375, 0.09521484375, 0.116455078125, 0.1376953125, 0.158935546875, 0.18017578125, 0.201416015625, 0.22265625, 0.243896484375, 0.26513671875, 0.286376953125, 0.3076171875, 0.328857421875, 0.35009765625, 0.371337890625, 0.392578125, 0.413818359375, 0.43505859375, 0.456298828125, 0.4775390625, 0.498779296875, 0.52001953125, 0.541259765625, 0.5625, 0.583740234375, 0.60498046875, 0.626220703125, 0.6474609375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 4.0, 5.0, 4.0, 8.0, 3.0, 8.0, 16.0, 26.0, 21.0, 29.0, 37.0, 67.0, 60.0, 85.0, 82.0, 82.0, 73.0, 74.0, 73.0, 51.0, 47.0, 31.0, 24.0, 20.0, 20.0, 5.0, 7.0, 12.0, 4.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026187896728515625, -0.002526789903640747, -0.0024347901344299316, -0.002342790365219116, -0.0022507905960083008, -0.0021587908267974854, -0.00206679105758667, -0.0019747912883758545, -0.001882791519165039, -0.0017907917499542236, -0.0016987919807434082, -0.0016067922115325928, -0.0015147924423217773, -0.001422792673110962, -0.0013307929039001465, -0.001238793134689331, -0.0011467933654785156, -0.0010547935962677002, -0.0009627938270568848, -0.0008707940578460693, -0.0007787942886352539, -0.0006867945194244385, -0.000594794750213623, -0.0005027949810028076, -0.0004107952117919922, -0.00031879544258117676, -0.00022679567337036133, -0.0001347959041595459, -4.279613494873047e-05, 4.920363426208496e-05, 0.0001412034034729004, 0.00023320317268371582, 0.00032520294189453125, 0.0004172027111053467, 0.0005092024803161621, 0.0006012022495269775, 0.000693202018737793, 0.0007852017879486084, 0.0008772015571594238, 0.0009692013263702393, 0.0010612010955810547, 0.0011532008647918701, 0.0012452006340026855, 0.001337200403213501, 0.0014292001724243164, 0.0015211999416351318, 0.0016131997108459473, 0.0017051994800567627, 0.0017971992492675781, 0.0018891990184783936, 0.001981198787689209, 0.0020731985569000244, 0.00216519832611084, 0.0022571980953216553, 0.0023491978645324707, 0.002441197633743286, 0.0025331974029541016, 0.002625197172164917, 0.0027171969413757324, 0.002809196710586548, 0.0029011964797973633, 0.0029931962490081787, 0.003085196018218994, 0.0031771957874298096, 0.003269195556640625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 8.0, 5.0, 14.0, 11.0, 14.0, 15.0, 35.0, 38.0, 71.0, 82.0, 122.0, 180.0, 349.0, 940.0, 182603.0, 861744.0, 1258.0, 422.0, 213.0, 128.0, 82.0, 52.0, 37.0, 36.0, 19.0, 14.0, 17.0, 8.0, 7.0, 5.0, 2.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0687255859375, -0.06676721572875977, -0.06480884552001953, -0.0628504753112793, -0.06089210510253906, -0.05893373489379883, -0.056975364685058594, -0.05501699447631836, -0.053058624267578125, -0.05110025405883789, -0.049141883850097656, -0.04718351364135742, -0.04522514343261719, -0.04326677322387695, -0.04130840301513672, -0.039350032806396484, -0.03739166259765625, -0.035433292388916016, -0.03347492218017578, -0.03151655197143555, -0.029558181762695312, -0.027599811553955078, -0.025641441345214844, -0.02368307113647461, -0.021724700927734375, -0.01976633071899414, -0.017807960510253906, -0.015849590301513672, -0.013891220092773438, -0.011932849884033203, -0.009974479675292969, -0.008016109466552734, -0.0060577392578125, -0.004099369049072266, -0.0021409988403320312, -0.00018262863159179688, 0.0017757415771484375, 0.003734111785888672, 0.005692481994628906, 0.007650852203369141, 0.009609222412109375, 0.01156759262084961, 0.013525962829589844, 0.015484333038330078, 0.017442703247070312, 0.019401073455810547, 0.02135944366455078, 0.023317813873291016, 0.02527618408203125, 0.027234554290771484, 0.02919292449951172, 0.031151294708251953, 0.03310966491699219, 0.03506803512573242, 0.037026405334472656, 0.03898477554321289, 0.040943145751953125, 0.04290151596069336, 0.044859886169433594, 0.04681825637817383, 0.04877662658691406, 0.0507349967956543, 0.05269336700439453, 0.054651737213134766, 0.056610107421875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 366.0, 651.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054013825953006744, -0.052995696663856506, -0.05197757109999657, -0.05095944181084633, -0.04994131252169609, -0.04892318695783615, -0.04790505766868591, -0.046886928379535675, -0.045868802815675735, -0.0448506735265255, -0.04383254796266556, -0.04281441867351532, -0.04179628938436508, -0.04077816382050514, -0.039760034531354904, -0.038741905242204666, -0.03772377967834473, -0.03670565038919449, -0.03568752482533455, -0.03466939553618431, -0.03365126624703407, -0.03263314068317413, -0.031615011394023895, -0.030596883967518806, -0.02957875281572342, -0.02856062538921833, -0.027542496100068092, -0.026524368673563004, -0.025506241247057915, -0.024488113820552826, -0.023469984531402588, -0.0224518571048975, -0.02143372967839241, -0.02041560225188732, -0.019397472962737083, -0.018379345536231995, -0.017361218109726906, -0.016343090683221817, -0.015324961394071579, -0.01430683396756649, -0.013288704678416252, -0.012270576320588589, -0.0112524488940835, -0.010234320536255836, -0.009216193109750748, -0.008198064751923084, -0.007179936394095421, -0.006161808501929045, -0.005143680609762669, -0.0041255527175962925, -0.0031074245925992727, -0.002089296467602253, -0.0010711685754358768, -5.304068326950073e-05, 0.0009650876745581627, 0.001983215566724539, 0.003001343458890915, 0.004019471351057291, 0.005037599243223667, 0.006055727601051331, 0.007073855493217707, 0.008091983385384083, 0.009110111743211746, 0.010128239169716835, 0.011146367527544498]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 5.0, 5.0, 9.0, 11.0, 11.0, 11.0, 20.0, 25.0, 25.0, 40.0, 38.0, 44.0, 44.0, 51.0, 45.0, 64.0, 65.0, 64.0, 67.0, 59.0, 53.0, 54.0, 41.0, 41.0, 28.0, 24.0, 19.0, 15.0, 13.0, 8.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001131296157836914, -0.0010736426338553429, -0.0010159891098737717, -0.0009583355858922005, -0.0009006820619106293, -0.0008430285379290581, -0.0007853750139474869, -0.0007277214899659157, -0.0006700679659843445, -0.0006124144420027733, -0.0005547609180212021, -0.0004971073940396309, -0.0004394538700580597, -0.0003818003460764885, -0.0003241468220949173, -0.0002664932981133461, -0.0002088397741317749, -0.0001511862501502037, -9.353272616863251e-05, -3.587920218706131e-05, 2.1774321794509888e-05, 7.942784577608109e-05, 0.00013708136975765228, 0.00019473489373922348, 0.0002523884177207947, 0.0003100419417023659, 0.00036769546568393707, 0.00042534898966550827, 0.00048300251364707947, 0.0005406560376286507, 0.0005983095616102219, 0.0006559630855917931, 0.0007136166095733643, 0.0007712701335549355, 0.0008289236575365067, 0.0008865771815180779, 0.000944230705499649, 0.0010018842294812202, 0.0010595377534627914, 0.0011171912774443626, 0.0011748448014259338, 0.001232498325407505, 0.0012901518493890762, 0.0013478053733706474, 0.0014054588973522186, 0.0014631124213337898, 0.001520765945315361, 0.0015784194692969322, 0.0016360729932785034, 0.0016937265172600746, 0.0017513800412416458, 0.001809033565223217, 0.0018666870892047882, 0.0019243406131863594, 0.0019819941371679306, 0.002039647661149502, 0.002097301185131073, 0.002154954709112644, 0.0022126082330942154, 0.0022702617570757866, 0.002327915281057358, 0.002385568805038929, 0.0024432223290205, 0.0025008758530020714, 0.0025585293769836426]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 7.0, 5.0, 4.0, 9.0, 11.0, 13.0, 11.0, 23.0, 15.0, 20.0, 20.0, 22.0, 21.0, 40.0, 40.0, 40.0, 35.0, 42.0, 39.0, 43.0, 32.0, 32.0, 43.0, 36.0, 32.0, 52.0, 34.0, 35.0, 43.0, 26.0, 29.0, 20.0, 15.0, 19.0, 14.0, 16.0, 11.0, 11.0, 11.0, 10.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.1328125, -5.9410400390625, -5.749267578125, -5.5574951171875, -5.36572265625, -5.1739501953125, -4.982177734375, -4.7904052734375, -4.5986328125, -4.4068603515625, -4.215087890625, -4.0233154296875, -3.83154296875, -3.6397705078125, -3.447998046875, -3.2562255859375, -3.064453125, -2.8726806640625, -2.680908203125, -2.4891357421875, -2.29736328125, -2.1055908203125, -1.913818359375, -1.7220458984375, -1.5302734375, -1.3385009765625, -1.146728515625, -0.9549560546875, -0.76318359375, -0.5714111328125, -0.379638671875, -0.1878662109375, 0.00390625, 0.1956787109375, 0.387451171875, 0.5792236328125, 0.77099609375, 0.9627685546875, 1.154541015625, 1.3463134765625, 1.5380859375, 1.7298583984375, 1.921630859375, 2.1134033203125, 2.30517578125, 2.4969482421875, 2.688720703125, 2.8804931640625, 3.072265625, 3.2640380859375, 3.455810546875, 3.6475830078125, 3.83935546875, 4.0311279296875, 4.222900390625, 4.4146728515625, 4.6064453125, 4.7982177734375, 4.989990234375, 5.1817626953125, 5.37353515625, 5.5653076171875, 5.757080078125, 5.9488525390625, 6.140625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 7.0, 12.0, 14.0, 9.0, 15.0, 15.0, 36.0, 31.0, 47.0, 64.0, 68.0, 119.0, 146.0, 201.0, 297.0, 368.0, 495.0, 736.0, 1585.0, 5292.0, 28112.0, 505408.0, 468650.0, 27465.0, 5066.0, 1565.0, 770.0, 484.0, 389.0, 279.0, 209.0, 137.0, 121.0, 74.0, 54.0, 39.0, 37.0, 37.0, 24.0, 23.0, 17.0, 6.0, 12.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.46875, -14.9852294921875, -14.501708984375, -14.0181884765625, -13.53466796875, -13.0511474609375, -12.567626953125, -12.0841064453125, -11.6005859375, -11.1170654296875, -10.633544921875, -10.1500244140625, -9.66650390625, -9.1829833984375, -8.699462890625, -8.2159423828125, -7.732421875, -7.2489013671875, -6.765380859375, -6.2818603515625, -5.79833984375, -5.3148193359375, -4.831298828125, -4.3477783203125, -3.8642578125, -3.3807373046875, -2.897216796875, -2.4136962890625, -1.93017578125, -1.4466552734375, -0.963134765625, -0.4796142578125, 0.00390625, 0.4874267578125, 0.970947265625, 1.4544677734375, 1.93798828125, 2.4215087890625, 2.905029296875, 3.3885498046875, 3.8720703125, 4.3555908203125, 4.839111328125, 5.3226318359375, 5.80615234375, 6.2896728515625, 6.773193359375, 7.2567138671875, 7.740234375, 8.2237548828125, 8.707275390625, 9.1907958984375, 9.67431640625, 10.1578369140625, 10.641357421875, 11.1248779296875, 11.6083984375, 12.0919189453125, 12.575439453125, 13.0589599609375, 13.54248046875, 14.0260009765625, 14.509521484375, 14.9930419921875, 15.4765625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 1.0, 7.0, 5.0, 5.0, 3.0, 6.0, 7.0, 11.0, 8.0, 11.0, 15.0, 23.0, 15.0, 31.0, 25.0, 27.0, 32.0, 37.0, 34.0, 29.0, 52.0, 39.0, 84.0, 444.0, 1526.0, 101.0, 54.0, 45.0, 41.0, 41.0, 34.0, 32.0, 33.0, 36.0, 16.0, 22.0, 24.0, 16.0, 7.0, 16.0, 14.0, 10.0, 8.0, 5.0, 4.0, 4.0, 4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.734375, -16.195068359375, -15.65576171875, -15.116455078125, -14.5771484375, -14.037841796875, -13.49853515625, -12.959228515625, -12.419921875, -11.880615234375, -11.34130859375, -10.802001953125, -10.2626953125, -9.723388671875, -9.18408203125, -8.644775390625, -8.10546875, -7.566162109375, -7.02685546875, -6.487548828125, -5.9482421875, -5.408935546875, -4.86962890625, -4.330322265625, -3.791015625, -3.251708984375, -2.71240234375, -2.173095703125, -1.6337890625, -1.094482421875, -0.55517578125, -0.015869140625, 0.5234375, 1.062744140625, 1.60205078125, 2.141357421875, 2.6806640625, 3.219970703125, 3.75927734375, 4.298583984375, 4.837890625, 5.377197265625, 5.91650390625, 6.455810546875, 6.9951171875, 7.534423828125, 8.07373046875, 8.613037109375, 9.15234375, 9.691650390625, 10.23095703125, 10.770263671875, 11.3095703125, 11.848876953125, 12.38818359375, 12.927490234375, 13.466796875, 14.006103515625, 14.54541015625, 15.084716796875, 15.6240234375, 16.163330078125, 16.70263671875, 17.241943359375, 17.78125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 4.0, 4.0, 2.0, 4.0, 8.0, 11.0, 12.0, 14.0, 14.0, 19.0, 24.0, 24.0, 24.0, 37.0, 40.0, 39.0, 58.0, 78.0, 117.0, 206.0, 443.0, 1490.0, 84206.0, 3052228.0, 5100.0, 647.0, 285.0, 133.0, 78.0, 61.0, 49.0, 37.0, 32.0, 39.0, 19.0, 22.0, 20.0, 11.0, 11.0, 10.0, 11.0, 7.0, 6.0, 4.0, 3.0, 7.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-50.09375, -48.58544921875, -47.0771484375, -45.56884765625, -44.060546875, -42.55224609375, -41.0439453125, -39.53564453125, -38.02734375, -36.51904296875, -35.0107421875, -33.50244140625, -31.994140625, -30.48583984375, -28.9775390625, -27.46923828125, -25.9609375, -24.45263671875, -22.9443359375, -21.43603515625, -19.927734375, -18.41943359375, -16.9111328125, -15.40283203125, -13.89453125, -12.38623046875, -10.8779296875, -9.36962890625, -7.861328125, -6.35302734375, -4.8447265625, -3.33642578125, -1.828125, -0.31982421875, 1.1884765625, 2.69677734375, 4.205078125, 5.71337890625, 7.2216796875, 8.72998046875, 10.23828125, 11.74658203125, 13.2548828125, 14.76318359375, 16.271484375, 17.77978515625, 19.2880859375, 20.79638671875, 22.3046875, 23.81298828125, 25.3212890625, 26.82958984375, 28.337890625, 29.84619140625, 31.3544921875, 32.86279296875, 34.37109375, 35.87939453125, 37.3876953125, 38.89599609375, 40.404296875, 41.91259765625, 43.4208984375, 44.92919921875, 46.4375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 89.0, 619.0, 290.0, 15.0], "bins": [-155.8143768310547, -153.29119873046875, -150.7680206298828, -148.2448272705078, -145.72164916992188, -143.19847106933594, -140.67529296875, -138.15211486816406, -135.62893676757812, -133.1057586669922, -130.58258056640625, -128.05938720703125, -125.53620910644531, -123.01303100585938, -120.48985290527344, -117.9666748046875, -115.4434814453125, -112.92030334472656, -110.3971176147461, -107.87393951416016, -105.35075378417969, -102.82757568359375, -100.30439758300781, -97.78121948242188, -95.2580337524414, -92.73485565185547, -90.211669921875, -87.68849182128906, -85.16531372070312, -82.64212799072266, -80.11894989013672, -77.59576416015625, -75.07258605957031, -72.54940795898438, -70.0262222290039, -67.50304412841797, -64.9798583984375, -62.45668029785156, -59.933502197265625, -57.41032028198242, -54.887142181396484, -52.36396026611328, -49.840782165527344, -47.31760025024414, -44.79441833496094, -42.271236419677734, -39.74805450439453, -37.224876403808594, -34.70169448852539, -32.17851257324219, -29.655332565307617, -27.132152557373047, -24.608970642089844, -22.08578872680664, -19.56260871887207, -17.0394287109375, -14.516246795654297, -11.99306583404541, -9.469884872436523, -6.946703910827637, -4.42352294921875, -1.9003419876098633, 0.6228389739990234, 3.1460189819335938, 5.669201374053955]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 9.0, 8.0, 8.0, 11.0, 15.0, 13.0, 17.0, 27.0, 24.0, 31.0, 39.0, 34.0, 43.0, 51.0, 55.0, 50.0, 51.0, 50.0, 51.0, 28.0, 46.0, 41.0, 47.0, 39.0, 27.0, 37.0, 29.0, 24.0, 15.0, 17.0, 14.0, 14.0, 10.0, 4.0, 5.0, 6.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.079185485839844, -51.39681625366211, -49.71445083618164, -48.032081604003906, -46.34971237182617, -44.66734313964844, -42.98497772216797, -41.302608489990234, -39.6202392578125, -37.937870025634766, -36.2555046081543, -34.57313537597656, -32.89076614379883, -31.208398818969727, -29.526031494140625, -27.84366226196289, -26.16129493713379, -24.478927612304688, -22.796558380126953, -21.11419105529785, -19.431821823120117, -17.749454498291016, -16.06708526611328, -14.38471794128418, -12.702349662780762, -11.019981384277344, -9.337613105773926, -7.655245304107666, -5.972877025604248, -4.290509223937988, -2.6081409454345703, -0.9257726669311523, 0.7565956115722656, 2.4389638900756836, 4.121332168579102, 5.803699970245361, 7.486068248748779, 9.168436050415039, 10.850804328918457, 12.533172607421875, 14.215540885925293, 15.897909164428711, 17.580276489257812, 19.262645721435547, 20.94501304626465, 22.62738037109375, 24.309749603271484, 25.99211883544922, 27.67448616027832, 29.356853485107422, 31.039222717285156, 32.72159194946289, 34.40395736694336, 36.086326599121094, 37.76869583129883, 39.45106506347656, 41.13343048095703, 42.815799713134766, 44.498165130615234, 46.18053436279297, 47.8629035949707, 49.54527282714844, 51.227638244628906, 52.91000747680664, 54.592376708984375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 12.0, 6.0, 7.0, 10.0, 12.0, 8.0, 18.0, 21.0, 13.0, 30.0, 18.0, 28.0, 31.0, 33.0, 29.0, 34.0, 34.0, 36.0, 43.0, 43.0, 34.0, 38.0, 39.0, 33.0, 40.0, 33.0, 41.0, 42.0, 25.0, 27.0, 30.0, 22.0, 17.0, 10.0, 22.0, 13.0, 10.0, 9.0, 14.0, 8.0, 5.0, 3.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.73828125, -5.55059814453125, -5.3629150390625, -5.17523193359375, -4.987548828125, -4.79986572265625, -4.6121826171875, -4.42449951171875, -4.23681640625, -4.04913330078125, -3.8614501953125, -3.67376708984375, -3.486083984375, -3.29840087890625, -3.1107177734375, -2.92303466796875, -2.7353515625, -2.54766845703125, -2.3599853515625, -2.17230224609375, -1.984619140625, -1.79693603515625, -1.6092529296875, -1.42156982421875, -1.23388671875, -1.04620361328125, -0.8585205078125, -0.67083740234375, -0.483154296875, -0.29547119140625, -0.1077880859375, 0.07989501953125, 0.267578125, 0.45526123046875, 0.6429443359375, 0.83062744140625, 1.018310546875, 1.20599365234375, 1.3936767578125, 1.58135986328125, 1.76904296875, 1.95672607421875, 2.1444091796875, 2.33209228515625, 2.519775390625, 2.70745849609375, 2.8951416015625, 3.08282470703125, 3.2705078125, 3.45819091796875, 3.6458740234375, 3.83355712890625, 4.021240234375, 4.20892333984375, 4.3966064453125, 4.58428955078125, 4.77197265625, 4.95965576171875, 5.1473388671875, 5.33502197265625, 5.522705078125, 5.71038818359375, 5.8980712890625, 6.08575439453125, 6.2734375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 5.0, 8.0, 10.0, 8.0, 12.0, 14.0, 24.0, 34.0, 40.0, 55.0, 68.0, 83.0, 109.0, 169.0, 247.0, 363.0, 575.0, 988.0, 1994.0, 4455.0, 12646.0, 55269.0, 477440.0, 2410576.0, 1078947.0, 117347.0, 20490.0, 6321.0, 2597.0, 1285.0, 641.0, 446.0, 291.0, 159.0, 134.0, 101.0, 74.0, 50.0, 42.0, 37.0, 29.0, 26.0, 17.0, 12.0, 15.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.515625, -11.140380859375, -10.76513671875, -10.389892578125, -10.0146484375, -9.639404296875, -9.26416015625, -8.888916015625, -8.513671875, -8.138427734375, -7.76318359375, -7.387939453125, -7.0126953125, -6.637451171875, -6.26220703125, -5.886962890625, -5.51171875, -5.136474609375, -4.76123046875, -4.385986328125, -4.0107421875, -3.635498046875, -3.26025390625, -2.885009765625, -2.509765625, -2.134521484375, -1.75927734375, -1.384033203125, -1.0087890625, -0.633544921875, -0.25830078125, 0.116943359375, 0.4921875, 0.867431640625, 1.24267578125, 1.617919921875, 1.9931640625, 2.368408203125, 2.74365234375, 3.118896484375, 3.494140625, 3.869384765625, 4.24462890625, 4.619873046875, 4.9951171875, 5.370361328125, 5.74560546875, 6.120849609375, 6.49609375, 6.871337890625, 7.24658203125, 7.621826171875, 7.9970703125, 8.372314453125, 8.74755859375, 9.122802734375, 9.498046875, 9.873291015625, 10.24853515625, 10.623779296875, 10.9990234375, 11.374267578125, 11.74951171875, 12.124755859375, 12.5]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 12.0, 9.0, 15.0, 37.0, 51.0, 85.0, 127.0, 204.0, 330.0, 524.0, 770.0, 698.0, 473.0, 283.0, 166.0, 124.0, 58.0, 45.0, 23.0, 16.0, 10.0, 6.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8125, -12.317138671875, -11.82177734375, -11.326416015625, -10.8310546875, -10.335693359375, -9.84033203125, -9.344970703125, -8.849609375, -8.354248046875, -7.85888671875, -7.363525390625, -6.8681640625, -6.372802734375, -5.87744140625, -5.382080078125, -4.88671875, -4.391357421875, -3.89599609375, -3.400634765625, -2.9052734375, -2.409912109375, -1.91455078125, -1.419189453125, -0.923828125, -0.428466796875, 0.06689453125, 0.562255859375, 1.0576171875, 1.552978515625, 2.04833984375, 2.543701171875, 3.0390625, 3.534423828125, 4.02978515625, 4.525146484375, 5.0205078125, 5.515869140625, 6.01123046875, 6.506591796875, 7.001953125, 7.497314453125, 7.99267578125, 8.488037109375, 8.9833984375, 9.478759765625, 9.97412109375, 10.469482421875, 10.96484375, 11.460205078125, 11.95556640625, 12.450927734375, 12.9462890625, 13.441650390625, 13.93701171875, 14.432373046875, 14.927734375, 15.423095703125, 15.91845703125, 16.413818359375, 16.9091796875, 17.404541015625, 17.89990234375, 18.395263671875, 18.890625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 5.0, 8.0, 7.0, 12.0, 15.0, 28.0, 33.0, 38.0, 85.0, 101.0, 138.0, 211.0, 357.0, 1047.0, 5324.0, 153336.0, 3960594.0, 67407.0, 3640.0, 856.0, 355.0, 200.0, 147.0, 91.0, 74.0, 42.0, 44.0, 30.0, 22.0, 12.0, 9.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-50.65625, -49.33740234375, -48.0185546875, -46.69970703125, -45.380859375, -44.06201171875, -42.7431640625, -41.42431640625, -40.10546875, -38.78662109375, -37.4677734375, -36.14892578125, -34.830078125, -33.51123046875, -32.1923828125, -30.87353515625, -29.5546875, -28.23583984375, -26.9169921875, -25.59814453125, -24.279296875, -22.96044921875, -21.6416015625, -20.32275390625, -19.00390625, -17.68505859375, -16.3662109375, -15.04736328125, -13.728515625, -12.40966796875, -11.0908203125, -9.77197265625, -8.453125, -7.13427734375, -5.8154296875, -4.49658203125, -3.177734375, -1.85888671875, -0.5400390625, 0.77880859375, 2.09765625, 3.41650390625, 4.7353515625, 6.05419921875, 7.373046875, 8.69189453125, 10.0107421875, 11.32958984375, 12.6484375, 13.96728515625, 15.2861328125, 16.60498046875, 17.923828125, 19.24267578125, 20.5615234375, 21.88037109375, 23.19921875, 24.51806640625, 25.8369140625, 27.15576171875, 28.474609375, 29.79345703125, 31.1123046875, 32.43115234375, 33.75]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 22.0, 116.0, 324.0, 368.0, 138.0, 37.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.95913696289062, -206.14895629882812, -202.33877563476562, -198.52859497070312, -194.7184295654297, -190.9082489013672, -187.0980682373047, -183.2878875732422, -179.4777069091797, -175.6675262451172, -171.8573455810547, -168.04718017578125, -164.23699951171875, -160.42681884765625, -156.61663818359375, -152.80645751953125, -148.99627685546875, -145.18609619140625, -141.37591552734375, -137.56573486328125, -133.7555694580078, -129.9453887939453, -126.13520812988281, -122.32502746582031, -118.51486206054688, -114.70468139648438, -110.8945083618164, -107.0843276977539, -103.2741470336914, -99.46397399902344, -95.65379333496094, -91.84361267089844, -88.0334243774414, -84.2232437133789, -80.41307067871094, -76.60289001464844, -72.79270935058594, -68.98252868652344, -65.17235565185547, -61.36217498779297, -57.551998138427734, -53.7418212890625, -49.931640625, -46.121463775634766, -42.31128692626953, -38.50110626220703, -34.6909294128418, -30.88075065612793, -27.070571899414062, -23.260393142700195, -19.450214385986328, -15.640037536621094, -11.829858779907227, -8.01968002319336, -4.209503173828125, -0.3993244171142578, 3.4108543395996094, 7.221032619476318, 11.031210899353027, 14.841388702392578, 18.651567459106445, 22.461746215820312, 26.271923065185547, 30.082101821899414, 33.89228057861328]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 3.0, 9.0, 11.0, 19.0, 16.0, 18.0, 32.0, 21.0, 20.0, 28.0, 29.0, 40.0, 28.0, 38.0, 41.0, 44.0, 40.0, 31.0, 40.0, 29.0, 43.0, 35.0, 36.0, 43.0, 40.0, 35.0, 32.0, 31.0, 29.0, 19.0, 16.0, 23.0, 7.0, 14.0, 9.0, 10.0, 9.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-31.353004455566406, -30.33247184753418, -29.311941146850586, -28.29140853881836, -27.270875930786133, -26.250343322753906, -25.229812622070312, -24.209280014038086, -23.18874740600586, -22.168214797973633, -21.14768409729004, -20.127151489257812, -19.106618881225586, -18.08608627319336, -17.065555572509766, -16.04502296447754, -15.024492263793945, -14.003960609436035, -12.983428001403809, -11.962896347045898, -10.942363739013672, -9.921832084655762, -8.901300430297852, -7.880768299102783, -6.860236167907715, -5.8397040367126465, -4.819171905517578, -3.798640251159668, -2.7781081199645996, -1.7575759887695312, -0.7370443344116211, 0.28348779678344727, 1.3040199279785156, 2.324552059173584, 3.3450839519500732, 4.3656158447265625, 5.386147975921631, 6.406680107116699, 7.427211761474609, 8.447744369506836, 9.468276023864746, 10.488807678222656, 11.509340286254883, 12.529871940612793, 13.550403594970703, 14.57093620300293, 15.59146785736084, 16.61199951171875, 17.632532119750977, 18.653064727783203, 19.673595428466797, 20.694128036499023, 21.71466064453125, 22.735191345214844, 23.75572395324707, 24.776256561279297, 25.79678726196289, 26.817319869995117, 27.83785057067871, 28.858383178710938, 29.878915786743164, 30.89944839477539, 31.919979095458984, 32.94050979614258, 33.96104431152344]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 1.0, 7.0, 8.0, 9.0, 6.0, 8.0, 8.0, 7.0, 17.0, 13.0, 13.0, 16.0, 20.0, 24.0, 25.0, 26.0, 40.0, 37.0, 26.0, 31.0, 32.0, 34.0, 48.0, 52.0, 34.0, 34.0, 33.0, 33.0, 38.0, 35.0, 21.0, 30.0, 30.0, 28.0, 20.0, 24.0, 26.0, 12.0, 12.0, 16.0, 20.0, 9.0, 6.0, 5.0, 6.0, 9.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.45703125, -5.27044677734375, -5.0838623046875, -4.89727783203125, -4.710693359375, -4.52410888671875, -4.3375244140625, -4.15093994140625, -3.96435546875, -3.77777099609375, -3.5911865234375, -3.40460205078125, -3.218017578125, -3.03143310546875, -2.8448486328125, -2.65826416015625, -2.4716796875, -2.28509521484375, -2.0985107421875, -1.91192626953125, -1.725341796875, -1.53875732421875, -1.3521728515625, -1.16558837890625, -0.97900390625, -0.79241943359375, -0.6058349609375, -0.41925048828125, -0.232666015625, -0.04608154296875, 0.1405029296875, 0.32708740234375, 0.513671875, 0.70025634765625, 0.8868408203125, 1.07342529296875, 1.260009765625, 1.44659423828125, 1.6331787109375, 1.81976318359375, 2.00634765625, 2.19293212890625, 2.3795166015625, 2.56610107421875, 2.752685546875, 2.93927001953125, 3.1258544921875, 3.31243896484375, 3.4990234375, 3.68560791015625, 3.8721923828125, 4.05877685546875, 4.245361328125, 4.43194580078125, 4.6185302734375, 4.80511474609375, 4.99169921875, 5.17828369140625, 5.3648681640625, 5.55145263671875, 5.738037109375, 5.92462158203125, 6.1112060546875, 6.29779052734375, 6.484375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [6.0, 7.0, 7.0, 20.0, 22.0, 25.0, 43.0, 56.0, 80.0, 108.0, 171.0, 234.0, 318.0, 407.0, 634.0, 806.0, 1071.0, 1497.0, 2147.0, 2800.0, 3999.0, 5301.0, 7361.0, 10102.0, 14267.0, 19917.0, 28532.0, 41355.0, 61103.0, 91951.0, 133345.0, 163429.0, 141535.0, 99005.0, 66043.0, 43882.0, 30687.0, 21282.0, 15326.0, 10950.0, 7771.0, 5585.0, 4157.0, 3108.0, 2230.0, 1577.0, 1187.0, 876.0, 642.0, 484.0, 335.0, 227.0, 171.0, 111.0, 94.0, 57.0, 54.0, 26.0, 20.0, 12.0, 8.0, 7.0, 3.0, 3.0], "bins": [-0.60888671875, -0.5896148681640625, -0.570343017578125, -0.5510711669921875, -0.53179931640625, -0.5125274658203125, -0.493255615234375, -0.4739837646484375, -0.4547119140625, -0.4354400634765625, -0.416168212890625, -0.3968963623046875, -0.37762451171875, -0.3583526611328125, -0.339080810546875, -0.3198089599609375, -0.300537109375, -0.2812652587890625, -0.261993408203125, -0.2427215576171875, -0.22344970703125, -0.2041778564453125, -0.184906005859375, -0.1656341552734375, -0.1463623046875, -0.1270904541015625, -0.107818603515625, -0.0885467529296875, -0.06927490234375, -0.0500030517578125, -0.030731201171875, -0.0114593505859375, 0.0078125, 0.0270843505859375, 0.046356201171875, 0.0656280517578125, 0.08489990234375, 0.1041717529296875, 0.123443603515625, 0.1427154541015625, 0.1619873046875, 0.1812591552734375, 0.200531005859375, 0.2198028564453125, 0.23907470703125, 0.2583465576171875, 0.277618408203125, 0.2968902587890625, 0.316162109375, 0.3354339599609375, 0.354705810546875, 0.3739776611328125, 0.39324951171875, 0.4125213623046875, 0.431793212890625, 0.4510650634765625, 0.4703369140625, 0.4896087646484375, 0.508880615234375, 0.5281524658203125, 0.54742431640625, 0.5666961669921875, 0.585968017578125, 0.6052398681640625, 0.62451171875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 12.0, 13.0, 12.0, 14.0, 16.0, 11.0, 22.0, 35.0, 25.0, 28.0, 38.0, 31.0, 32.0, 30.0, 30.0, 38.0, 28.0, 43.0, 1067.0, 38.0, 25.0, 40.0, 35.0, 27.0, 42.0, 33.0, 31.0, 28.0, 19.0, 19.0, 19.0, 13.0, 15.0, 15.0, 12.0, 13.0, 13.0, 8.0, 8.0, 7.0, 9.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-4.26171875, -4.13787841796875, -4.0140380859375, -3.89019775390625, -3.766357421875, -3.64251708984375, -3.5186767578125, -3.39483642578125, -3.27099609375, -3.14715576171875, -3.0233154296875, -2.89947509765625, -2.775634765625, -2.65179443359375, -2.5279541015625, -2.40411376953125, -2.2802734375, -2.15643310546875, -2.0325927734375, -1.90875244140625, -1.784912109375, -1.66107177734375, -1.5372314453125, -1.41339111328125, -1.28955078125, -1.16571044921875, -1.0418701171875, -0.91802978515625, -0.794189453125, -0.67034912109375, -0.5465087890625, -0.42266845703125, -0.298828125, -0.17498779296875, -0.0511474609375, 0.07269287109375, 0.196533203125, 0.32037353515625, 0.4442138671875, 0.56805419921875, 0.69189453125, 0.81573486328125, 0.9395751953125, 1.06341552734375, 1.187255859375, 1.31109619140625, 1.4349365234375, 1.55877685546875, 1.6826171875, 1.80645751953125, 1.9302978515625, 2.05413818359375, 2.177978515625, 2.30181884765625, 2.4256591796875, 2.54949951171875, 2.67333984375, 2.79718017578125, 2.9210205078125, 3.04486083984375, 3.168701171875, 3.29254150390625, 3.4163818359375, 3.54022216796875, 3.6640625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 14.0, 17.0, 21.0, 37.0, 61.0, 89.0, 124.0, 183.0, 264.0, 431.0, 647.0, 934.0, 1583.0, 2535.0, 4115.0, 6734.0, 11350.0, 19119.0, 32732.0, 57040.0, 102086.0, 179617.0, 1283590.0, 169082.0, 95050.0, 53464.0, 30684.0, 17941.0, 10523.0, 6415.0, 3942.0, 2518.0, 1529.0, 980.0, 584.0, 376.0, 243.0, 174.0, 109.0, 62.0, 31.0, 34.0, 18.0, 16.0, 5.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.7041015625, -0.6801834106445312, -0.6562652587890625, -0.6323471069335938, -0.608428955078125, -0.5845108032226562, -0.5605926513671875, -0.5366744995117188, -0.51275634765625, -0.48883819580078125, -0.4649200439453125, -0.44100189208984375, -0.417083740234375, -0.39316558837890625, -0.3692474365234375, -0.34532928466796875, -0.3214111328125, -0.29749298095703125, -0.2735748291015625, -0.24965667724609375, -0.225738525390625, -0.20182037353515625, -0.1779022216796875, -0.15398406982421875, -0.13006591796875, -0.10614776611328125, -0.0822296142578125, -0.05831146240234375, -0.034393310546875, -0.01047515869140625, 0.0134429931640625, 0.03736114501953125, 0.061279296875, 0.08519744873046875, 0.1091156005859375, 0.13303375244140625, 0.156951904296875, 0.18087005615234375, 0.2047882080078125, 0.22870635986328125, 0.25262451171875, 0.27654266357421875, 0.3004608154296875, 0.32437896728515625, 0.348297119140625, 0.37221527099609375, 0.3961334228515625, 0.42005157470703125, 0.4439697265625, 0.46788787841796875, 0.4918060302734375, 0.5157241821289062, 0.539642333984375, 0.5635604858398438, 0.5874786376953125, 0.6113967895507812, 0.63531494140625, 0.6592330932617188, 0.6831512451171875, 0.7070693969726562, 0.730987548828125, 0.7549057006835938, 0.7788238525390625, 0.8027420043945312, 0.82666015625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 11.0, 5.0, 4.0, 7.0, 15.0, 18.0, 29.0, 26.0, 32.0, 21.0, 32.0, 60.0, 41.0, 66.0, 58.0, 56.0, 64.0, 53.0, 52.0, 59.0, 36.0, 42.0, 31.0, 29.0, 41.0, 26.0, 22.0, 14.0, 9.0, 8.0, 4.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0027141571044921875, -0.002634882926940918, -0.0025556087493896484, -0.002476334571838379, -0.0023970603942871094, -0.00231778621673584, -0.0022385120391845703, -0.0021592378616333008, -0.0020799636840820312, -0.0020006895065307617, -0.0019214153289794922, -0.0018421411514282227, -0.0017628669738769531, -0.0016835927963256836, -0.001604318618774414, -0.0015250444412231445, -0.001445770263671875, -0.0013664960861206055, -0.001287221908569336, -0.0012079477310180664, -0.0011286735534667969, -0.0010493993759155273, -0.0009701251983642578, -0.0008908510208129883, -0.0008115768432617188, -0.0007323026657104492, -0.0006530284881591797, -0.0005737543106079102, -0.0004944801330566406, -0.0004152059555053711, -0.00033593177795410156, -0.00025665760040283203, -0.0001773834228515625, -9.810924530029297e-05, -1.8835067749023438e-05, 6.0439109802246094e-05, 0.00013971328735351562, 0.00021898746490478516, 0.0002982616424560547, 0.0003775358200073242, 0.00045680999755859375, 0.0005360841751098633, 0.0006153583526611328, 0.0006946325302124023, 0.0007739067077636719, 0.0008531808853149414, 0.0009324550628662109, 0.0010117292404174805, 0.00109100341796875, 0.0011702775955200195, 0.001249551773071289, 0.0013288259506225586, 0.0014081001281738281, 0.0014873743057250977, 0.0015666484832763672, 0.0016459226608276367, 0.0017251968383789062, 0.0018044710159301758, 0.0018837451934814453, 0.001963019371032715, 0.0020422935485839844, 0.002121567726135254, 0.0022008419036865234, 0.002280116081237793, 0.0023593902587890625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 10.0, 6.0, 15.0, 27.0, 27.0, 34.0, 46.0, 76.0, 82.0, 77.0, 126.0, 174.0, 318.0, 609.0, 2237.0, 859854.0, 182102.0, 1234.0, 498.0, 280.0, 176.0, 118.0, 98.0, 69.0, 50.0, 39.0, 24.0, 37.0, 21.0, 14.0, 13.0, 12.0, 8.0, 6.0, 7.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04827880859375, -0.04671478271484375, -0.0451507568359375, -0.04358673095703125, -0.042022705078125, -0.04045867919921875, -0.0388946533203125, -0.03733062744140625, -0.0357666015625, -0.03420257568359375, -0.0326385498046875, -0.03107452392578125, -0.029510498046875, -0.02794647216796875, -0.0263824462890625, -0.02481842041015625, -0.02325439453125, -0.02169036865234375, -0.0201263427734375, -0.01856231689453125, -0.016998291015625, -0.01543426513671875, -0.0138702392578125, -0.01230621337890625, -0.0107421875, -0.00917816162109375, -0.0076141357421875, -0.00605010986328125, -0.004486083984375, -0.00292205810546875, -0.0013580322265625, 0.00020599365234375, 0.00177001953125, 0.00333404541015625, 0.0048980712890625, 0.00646209716796875, 0.008026123046875, 0.00959014892578125, 0.0111541748046875, 0.01271820068359375, 0.0142822265625, 0.01584625244140625, 0.0174102783203125, 0.01897430419921875, 0.020538330078125, 0.02210235595703125, 0.0236663818359375, 0.02523040771484375, 0.02679443359375, 0.02835845947265625, 0.0299224853515625, 0.03148651123046875, 0.033050537109375, 0.03461456298828125, 0.0361785888671875, 0.03774261474609375, 0.039306640625, 0.04087066650390625, 0.0424346923828125, 0.04399871826171875, 0.045562744140625, 0.04712677001953125, 0.0486907958984375, 0.05025482177734375, 0.05181884765625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 981.0, 32.0], "bins": [-0.057560306042432785, -0.056641124188899994, -0.0557219460606575, -0.05480276420712471, -0.05388358607888222, -0.052964404225349426, -0.052045226097106934, -0.05112604424357414, -0.05020686611533165, -0.04928768426179886, -0.048368506133556366, -0.047449324280023575, -0.04653014615178108, -0.04561096429824829, -0.0446917861700058, -0.04377260431647301, -0.042853426188230515, -0.04193424433469772, -0.04101506620645523, -0.04009588435292244, -0.03917670622467995, -0.038257524371147156, -0.03733834624290466, -0.03641916438937187, -0.03549998626112938, -0.03458080440759659, -0.033661626279354095, -0.032742444425821304, -0.03182326629757881, -0.03090408630669117, -0.029984906315803528, -0.029065726324915886, -0.028146542608737946, -0.027227362617850304, -0.026308182626962662, -0.02538900263607502, -0.024469822645187378, -0.023550642654299736, -0.022631462663412094, -0.021712282672524452, -0.02079310268163681, -0.01987392269074917, -0.018954742699861526, -0.018035562708973885, -0.017116382718086243, -0.0161972027271986, -0.015278022736310959, -0.014358842745423317, -0.0134396618232131, -0.012520481832325459, -0.011601301841437817, -0.010682121850550175, -0.009762941859662533, -0.008843760937452316, -0.007924580946564674, -0.00700540142133832, -0.006086221896111965, -0.005167041905224323, -0.004247861914336681, -0.003328681690618396, -0.002409501699730754, -0.0014903214760124683, -0.0005711414851248264, 0.0003480385057628155, 0.0012672186130657792]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 9.0, 17.0, 29.0, 31.0, 29.0, 45.0, 41.0, 61.0, 76.0, 59.0, 79.0, 89.0, 67.0, 80.0, 72.0, 67.0, 34.0, 32.0, 23.0, 26.0, 18.0, 8.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014080405235290527, -0.0013303542509675026, -0.0012526679784059525, -0.0011749817058444023, -0.0010972954332828522, -0.001019609160721302, -0.0009419228881597519, -0.0008642366155982018, -0.0007865503430366516, -0.0007088640704751015, -0.0006311777979135513, -0.0005534915253520012, -0.00047580525279045105, -0.0003981189802289009, -0.00032043270766735077, -0.00024274643510580063, -0.0001650601625442505, -8.737388998270035e-05, -9.687617421150208e-06, 6.799865514039993e-05, 0.00014568492770195007, 0.00022337120026350021, 0.00030105747282505035, 0.0003787437453866005, 0.00045643001794815063, 0.0005341162905097008, 0.0006118025630712509, 0.0006894888356328011, 0.0007671751081943512, 0.0008448613807559013, 0.0009225476533174515, 0.0010002339258790016, 0.0010779201984405518, 0.001155606471002102, 0.001233292743563652, 0.0013109790161252022, 0.0013886652886867523, 0.0014663515612483025, 0.0015440378338098526, 0.0016217241063714027, 0.0016994103789329529, 0.001777096651494503, 0.0018547829240560532, 0.0019324691966176033, 0.0020101554691791534, 0.0020878417417407036, 0.0021655280143022537, 0.002243214286863804, 0.002320900559425354, 0.002398586831986904, 0.0024762731045484543, 0.0025539593771100044, 0.0026316456496715546, 0.0027093319222331047, 0.002787018194794655, 0.002864704467356205, 0.002942390739917755, 0.0030200770124793053, 0.0030977632850408554, 0.0031754495576024055, 0.0032531358301639557, 0.003330822102725506, 0.003408508375287056, 0.003486194647848606, 0.0035638809204101562]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 1.0, 7.0, 8.0, 9.0, 6.0, 8.0, 7.0, 8.0, 17.0, 13.0, 13.0, 16.0, 20.0, 24.0, 25.0, 26.0, 40.0, 37.0, 26.0, 31.0, 32.0, 34.0, 47.0, 53.0, 34.0, 34.0, 33.0, 33.0, 38.0, 35.0, 21.0, 30.0, 30.0, 28.0, 20.0, 24.0, 26.0, 12.0, 12.0, 16.0, 20.0, 9.0, 6.0, 5.0, 6.0, 9.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.45703125, -5.27044677734375, -5.0838623046875, -4.89727783203125, -4.710693359375, -4.52410888671875, -4.3375244140625, -4.15093994140625, -3.96435546875, -3.77777099609375, -3.5911865234375, -3.40460205078125, -3.218017578125, -3.03143310546875, -2.8448486328125, -2.65826416015625, -2.4716796875, -2.28509521484375, -2.0985107421875, -1.91192626953125, -1.725341796875, -1.53875732421875, -1.3521728515625, -1.16558837890625, -0.97900390625, -0.79241943359375, -0.6058349609375, -0.41925048828125, -0.232666015625, -0.04608154296875, 0.1405029296875, 0.32708740234375, 0.513671875, 0.70025634765625, 0.8868408203125, 1.07342529296875, 1.260009765625, 1.44659423828125, 1.6331787109375, 1.81976318359375, 2.00634765625, 2.19293212890625, 2.3795166015625, 2.56610107421875, 2.752685546875, 2.93927001953125, 3.1258544921875, 3.31243896484375, 3.4990234375, 3.68560791015625, 3.8721923828125, 4.05877685546875, 4.245361328125, 4.43194580078125, 4.6185302734375, 4.80511474609375, 4.99169921875, 5.17828369140625, 5.3648681640625, 5.55145263671875, 5.738037109375, 5.92462158203125, 6.1112060546875, 6.29779052734375, 6.484375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 10.0, 12.0, 16.0, 17.0, 24.0, 26.0, 32.0, 48.0, 41.0, 69.0, 83.0, 113.0, 157.0, 275.0, 392.0, 700.0, 1315.0, 2563.0, 5607.0, 12830.0, 31776.0, 88536.0, 303733.0, 410432.0, 118732.0, 41176.0, 16071.0, 6819.0, 3154.0, 1491.0, 794.0, 494.0, 275.0, 178.0, 144.0, 107.0, 66.0, 55.0, 33.0, 41.0, 27.0, 14.0, 17.0, 12.0, 12.0, 5.0, 10.0, 6.0, 2.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.95703125, -6.71820068359375, -6.4793701171875, -6.24053955078125, -6.001708984375, -5.76287841796875, -5.5240478515625, -5.28521728515625, -5.04638671875, -4.80755615234375, -4.5687255859375, -4.32989501953125, -4.091064453125, -3.85223388671875, -3.6134033203125, -3.37457275390625, -3.1357421875, -2.89691162109375, -2.6580810546875, -2.41925048828125, -2.180419921875, -1.94158935546875, -1.7027587890625, -1.46392822265625, -1.22509765625, -0.98626708984375, -0.7474365234375, -0.50860595703125, -0.269775390625, -0.03094482421875, 0.2078857421875, 0.44671630859375, 0.685546875, 0.92437744140625, 1.1632080078125, 1.40203857421875, 1.640869140625, 1.87969970703125, 2.1185302734375, 2.35736083984375, 2.59619140625, 2.83502197265625, 3.0738525390625, 3.31268310546875, 3.551513671875, 3.79034423828125, 4.0291748046875, 4.26800537109375, 4.5068359375, 4.74566650390625, 4.9844970703125, 5.22332763671875, 5.462158203125, 5.70098876953125, 5.9398193359375, 6.17864990234375, 6.41748046875, 6.65631103515625, 6.8951416015625, 7.13397216796875, 7.372802734375, 7.61163330078125, 7.8504638671875, 8.08929443359375, 8.328125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 1.0, 5.0, 7.0, 16.0, 14.0, 7.0, 20.0, 19.0, 20.0, 14.0, 32.0, 35.0, 29.0, 42.0, 41.0, 44.0, 51.0, 75.0, 111.0, 313.0, 1510.0, 147.0, 86.0, 76.0, 49.0, 37.0, 42.0, 26.0, 20.0, 24.0, 17.0, 23.0, 18.0, 7.0, 16.0, 8.0, 7.0, 8.0, 6.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.8125, -16.23583984375, -15.6591796875, -15.08251953125, -14.505859375, -13.92919921875, -13.3525390625, -12.77587890625, -12.19921875, -11.62255859375, -11.0458984375, -10.46923828125, -9.892578125, -9.31591796875, -8.7392578125, -8.16259765625, -7.5859375, -7.00927734375, -6.4326171875, -5.85595703125, -5.279296875, -4.70263671875, -4.1259765625, -3.54931640625, -2.97265625, -2.39599609375, -1.8193359375, -1.24267578125, -0.666015625, -0.08935546875, 0.4873046875, 1.06396484375, 1.640625, 2.21728515625, 2.7939453125, 3.37060546875, 3.947265625, 4.52392578125, 5.1005859375, 5.67724609375, 6.25390625, 6.83056640625, 7.4072265625, 7.98388671875, 8.560546875, 9.13720703125, 9.7138671875, 10.29052734375, 10.8671875, 11.44384765625, 12.0205078125, 12.59716796875, 13.173828125, 13.75048828125, 14.3271484375, 14.90380859375, 15.48046875, 16.05712890625, 16.6337890625, 17.21044921875, 17.787109375, 18.36376953125, 18.9404296875, 19.51708984375, 20.09375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 9.0, 7.0, 10.0, 16.0, 23.0, 39.0, 29.0, 52.0, 95.0, 131.0, 198.0, 364.0, 793.0, 6256.0, 583838.0, 2540141.0, 11527.0, 1013.0, 421.0, 258.0, 155.0, 89.0, 63.0, 59.0, 28.0, 25.0, 17.0, 20.0, 8.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.4375, -29.27099609375, -28.1044921875, -26.93798828125, -25.771484375, -24.60498046875, -23.4384765625, -22.27197265625, -21.10546875, -19.93896484375, -18.7724609375, -17.60595703125, -16.439453125, -15.27294921875, -14.1064453125, -12.93994140625, -11.7734375, -10.60693359375, -9.4404296875, -8.27392578125, -7.107421875, -5.94091796875, -4.7744140625, -3.60791015625, -2.44140625, -1.27490234375, -0.1083984375, 1.05810546875, 2.224609375, 3.39111328125, 4.5576171875, 5.72412109375, 6.890625, 8.05712890625, 9.2236328125, 10.39013671875, 11.556640625, 12.72314453125, 13.8896484375, 15.05615234375, 16.22265625, 17.38916015625, 18.5556640625, 19.72216796875, 20.888671875, 22.05517578125, 23.2216796875, 24.38818359375, 25.5546875, 26.72119140625, 27.8876953125, 29.05419921875, 30.220703125, 31.38720703125, 32.5537109375, 33.72021484375, 34.88671875, 36.05322265625, 37.2197265625, 38.38623046875, 39.552734375, 40.71923828125, 41.8857421875, 43.05224609375, 44.21875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 514.0, 474.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.32444763183594, -55.664268493652344, -51.004093170166016, -46.34391784667969, -41.683738708496094, -37.0235595703125, -32.36338424682617, -27.703208923339844, -23.04302978515625, -18.38285255432129, -13.722675323486328, -9.062498092651367, -4.402320861816406, 0.2578563690185547, 4.918033599853516, 9.578208923339844, 14.238388061523438, 18.8985652923584, 23.55874252319336, 28.21891975402832, 32.87909698486328, 37.539276123046875, 42.1994514465332, 46.85962677001953, 51.519805908203125, 56.17998504638672, 60.84016036987305, 65.50033569335938, 70.16051483154297, 74.82069396972656, 79.48086547851562, 84.14104461669922, 88.80122375488281, 93.4614028930664, 98.12158203125, 102.78175354003906, 107.44193267822266, 112.10211181640625, 116.76228332519531, 121.4224624633789, 126.0826416015625, 130.74281311035156, 135.4029998779297, 140.06317138671875, 144.72335815429688, 149.38352966308594, 154.043701171875, 158.70388793945312, 163.3640594482422, 168.02423095703125, 172.68441772460938, 177.34458923339844, 182.0047607421875, 186.66494750976562, 191.3251190185547, 195.98529052734375, 200.64547729492188, 205.30564880371094, 209.96583557128906, 214.62600708007812, 219.28619384765625, 223.9463653564453, 228.60653686523438, 233.2667236328125, 237.92689514160156]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 4.0, 9.0, 3.0, 9.0, 9.0, 8.0, 12.0, 15.0, 19.0, 20.0, 25.0, 24.0, 24.0, 16.0, 20.0, 26.0, 25.0, 36.0, 36.0, 39.0, 34.0, 35.0, 38.0, 46.0, 38.0, 33.0, 33.0, 32.0, 31.0, 35.0, 20.0, 36.0, 23.0, 24.0, 23.0, 24.0, 13.0, 14.0, 12.0, 6.0, 7.0, 9.0, 7.0, 7.0, 9.0, 4.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0], "bins": [-34.837284088134766, -33.746849060058594, -32.65641784667969, -31.56598472595215, -30.47555160522461, -29.38511848449707, -28.29468536376953, -27.20425033569336, -26.113819122314453, -25.023386001586914, -23.932952880859375, -22.842519760131836, -21.752086639404297, -20.661653518676758, -19.57122039794922, -18.480785369873047, -17.390352249145508, -16.29991912841797, -15.20948600769043, -14.11905288696289, -13.028619766235352, -11.938186645507812, -10.847752571105957, -9.757319450378418, -8.666886329650879, -7.57645320892334, -6.486020088195801, -5.3955864906311035, -4.3051533699035645, -3.2147202491760254, -2.124286651611328, -1.033853530883789, 0.05657958984375, 1.1470128297805786, 2.2374460697174072, 3.3278794288635254, 4.4183125495910645, 5.5087456703186035, 6.599179267883301, 7.68961238861084, 8.780045509338379, 9.870478630065918, 10.960911750793457, 12.051345825195312, 13.141778945922852, 14.23221206665039, 15.32264518737793, 16.41307830810547, 17.503511428833008, 18.593944549560547, 19.684377670288086, 20.774810791015625, 21.865243911743164, 22.955677032470703, 24.046112060546875, 25.13654327392578, 26.226978302001953, 27.317411422729492, 28.40784454345703, 29.49827766418457, 30.58871078491211, 31.67914390563965, 32.76957702636719, 33.86001205444336, 34.950443267822266]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 5.0, 6.0, 7.0, 14.0, 8.0, 7.0, 15.0, 11.0, 17.0, 21.0, 14.0, 23.0, 27.0, 31.0, 37.0, 32.0, 36.0, 40.0, 26.0, 40.0, 46.0, 42.0, 33.0, 35.0, 34.0, 31.0, 38.0, 33.0, 29.0, 28.0, 31.0, 24.0, 27.0, 18.0, 18.0, 14.0, 14.0, 17.0, 16.0, 6.0, 8.0, 9.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78125, -5.5869140625, -5.392578125, -5.1982421875, -5.00390625, -4.8095703125, -4.615234375, -4.4208984375, -4.2265625, -4.0322265625, -3.837890625, -3.6435546875, -3.44921875, -3.2548828125, -3.060546875, -2.8662109375, -2.671875, -2.4775390625, -2.283203125, -2.0888671875, -1.89453125, -1.7001953125, -1.505859375, -1.3115234375, -1.1171875, -0.9228515625, -0.728515625, -0.5341796875, -0.33984375, -0.1455078125, 0.048828125, 0.2431640625, 0.4375, 0.6318359375, 0.826171875, 1.0205078125, 1.21484375, 1.4091796875, 1.603515625, 1.7978515625, 1.9921875, 2.1865234375, 2.380859375, 2.5751953125, 2.76953125, 2.9638671875, 3.158203125, 3.3525390625, 3.546875, 3.7412109375, 3.935546875, 4.1298828125, 4.32421875, 4.5185546875, 4.712890625, 4.9072265625, 5.1015625, 5.2958984375, 5.490234375, 5.6845703125, 5.87890625, 6.0732421875, 6.267578125, 6.4619140625, 6.65625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 7.0, 8.0, 17.0, 10.0, 12.0, 25.0, 27.0, 36.0, 45.0, 88.0, 124.0, 272.0, 562.0, 1310.0, 3861.0, 14236.0, 111318.0, 2352079.0, 1626123.0, 68044.0, 10808.0, 3115.0, 1116.0, 457.0, 196.0, 126.0, 66.0, 36.0, 27.0, 23.0, 19.0, 17.0, 17.0, 10.0, 11.0, 6.0, 5.0, 7.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.484375, -16.879638671875, -16.27490234375, -15.670166015625, -15.0654296875, -14.460693359375, -13.85595703125, -13.251220703125, -12.646484375, -12.041748046875, -11.43701171875, -10.832275390625, -10.2275390625, -9.622802734375, -9.01806640625, -8.413330078125, -7.80859375, -7.203857421875, -6.59912109375, -5.994384765625, -5.3896484375, -4.784912109375, -4.18017578125, -3.575439453125, -2.970703125, -2.365966796875, -1.76123046875, -1.156494140625, -0.5517578125, 0.052978515625, 0.65771484375, 1.262451171875, 1.8671875, 2.471923828125, 3.07666015625, 3.681396484375, 4.2861328125, 4.890869140625, 5.49560546875, 6.100341796875, 6.705078125, 7.309814453125, 7.91455078125, 8.519287109375, 9.1240234375, 9.728759765625, 10.33349609375, 10.938232421875, 11.54296875, 12.147705078125, 12.75244140625, 13.357177734375, 13.9619140625, 14.566650390625, 15.17138671875, 15.776123046875, 16.380859375, 16.985595703125, 17.59033203125, 18.195068359375, 18.7998046875, 19.404541015625, 20.00927734375, 20.614013671875, 21.21875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 9.0, 3.0, 8.0, 8.0, 11.0, 13.0, 12.0, 28.0, 25.0, 29.0, 41.0, 59.0, 88.0, 127.0, 172.0, 243.0, 333.0, 471.0, 533.0, 502.0, 408.0, 267.0, 179.0, 131.0, 96.0, 73.0, 49.0, 35.0, 34.0, 18.0, 16.0, 17.0, 8.0, 11.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.696044921875, -8.39208984375, -8.088134765625, -7.7841796875, -7.480224609375, -7.17626953125, -6.872314453125, -6.568359375, -6.264404296875, -5.96044921875, -5.656494140625, -5.3525390625, -5.048583984375, -4.74462890625, -4.440673828125, -4.13671875, -3.832763671875, -3.52880859375, -3.224853515625, -2.9208984375, -2.616943359375, -2.31298828125, -2.009033203125, -1.705078125, -1.401123046875, -1.09716796875, -0.793212890625, -0.4892578125, -0.185302734375, 0.11865234375, 0.422607421875, 0.7265625, 1.030517578125, 1.33447265625, 1.638427734375, 1.9423828125, 2.246337890625, 2.55029296875, 2.854248046875, 3.158203125, 3.462158203125, 3.76611328125, 4.070068359375, 4.3740234375, 4.677978515625, 4.98193359375, 5.285888671875, 5.58984375, 5.893798828125, 6.19775390625, 6.501708984375, 6.8056640625, 7.109619140625, 7.41357421875, 7.717529296875, 8.021484375, 8.325439453125, 8.62939453125, 8.933349609375, 9.2373046875, 9.541259765625, 9.84521484375, 10.149169921875, 10.453125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 12.0, 10.0, 9.0, 18.0, 22.0, 27.0, 47.0, 68.0, 122.0, 199.0, 462.0, 951.0, 2524.0, 9882.0, 64205.0, 1255360.0, 2729127.0, 111346.0, 14171.0, 3314.0, 1189.0, 543.0, 268.0, 128.0, 87.0, 61.0, 37.0, 19.0, 25.0, 16.0, 11.0, 6.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.734375, -21.0576171875, -20.380859375, -19.7041015625, -19.02734375, -18.3505859375, -17.673828125, -16.9970703125, -16.3203125, -15.6435546875, -14.966796875, -14.2900390625, -13.61328125, -12.9365234375, -12.259765625, -11.5830078125, -10.90625, -10.2294921875, -9.552734375, -8.8759765625, -8.19921875, -7.5224609375, -6.845703125, -6.1689453125, -5.4921875, -4.8154296875, -4.138671875, -3.4619140625, -2.78515625, -2.1083984375, -1.431640625, -0.7548828125, -0.078125, 0.5986328125, 1.275390625, 1.9521484375, 2.62890625, 3.3056640625, 3.982421875, 4.6591796875, 5.3359375, 6.0126953125, 6.689453125, 7.3662109375, 8.04296875, 8.7197265625, 9.396484375, 10.0732421875, 10.75, 11.4267578125, 12.103515625, 12.7802734375, 13.45703125, 14.1337890625, 14.810546875, 15.4873046875, 16.1640625, 16.8408203125, 17.517578125, 18.1943359375, 18.87109375, 19.5478515625, 20.224609375, 20.9013671875, 21.578125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 8.0, 14.0, 63.0, 195.0, 365.0, 249.0, 94.0, 23.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.16478729248047, -119.70677185058594, -116.2487564086914, -112.79074096679688, -109.33272552490234, -105.87471008300781, -102.41669464111328, -98.95867919921875, -95.50066375732422, -92.04264831542969, -88.58463287353516, -85.12661743164062, -81.6686019897461, -78.21058654785156, -74.75257110595703, -71.2945556640625, -67.83654022216797, -64.37852478027344, -60.920509338378906, -57.462493896484375, -54.004478454589844, -50.54646301269531, -47.08844757080078, -43.63043212890625, -40.17241668701172, -36.71440124511719, -33.256385803222656, -29.798370361328125, -26.340354919433594, -22.882339477539062, -19.42432403564453, -15.96630859375, -12.508293151855469, -9.050277709960938, -5.592262268066406, -2.134246826171875, 1.3237686157226562, 4.7817840576171875, 8.239799499511719, 11.69781494140625, 15.155830383300781, 18.613845825195312, 22.071861267089844, 25.529876708984375, 28.987892150878906, 32.44590759277344, 35.90392303466797, 39.3619384765625, 42.81995391845703, 46.27796936035156, 49.735984802246094, 53.194000244140625, 56.652015686035156, 60.11003112792969, 63.56804656982422, 67.02606201171875, 70.48407745361328, 73.94209289550781, 77.40010833740234, 80.85812377929688, 84.3161392211914, 87.77415466308594, 91.23217010498047, 94.690185546875, 98.14820098876953]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 11.0, 10.0, 9.0, 8.0, 9.0, 17.0, 18.0, 23.0, 21.0, 24.0, 23.0, 26.0, 32.0, 21.0, 29.0, 29.0, 36.0, 24.0, 30.0, 48.0, 32.0, 40.0, 40.0, 38.0, 37.0, 30.0, 36.0, 29.0, 22.0, 23.0, 32.0, 33.0, 23.0, 17.0, 23.0, 18.0, 14.0, 13.0, 3.0, 11.0, 9.0, 9.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-26.51313018798828, -25.61332893371582, -24.713525772094727, -23.813724517822266, -22.913921356201172, -22.01412010192871, -21.11431884765625, -20.214515686035156, -19.314714431762695, -18.414913177490234, -17.51511001586914, -16.61530876159668, -15.715506553649902, -14.815704345703125, -13.915903091430664, -13.016100883483887, -12.11629867553711, -11.216496467590332, -10.316694259643555, -9.416893005371094, -8.517090797424316, -7.617288589477539, -6.71748685836792, -5.817685127258301, -4.917882919311523, -4.018080711364746, -3.118278980255127, -2.2184770107269287, -1.3186750411987305, -0.4188728332519531, 0.480928897857666, 1.3807306289672852, 2.2805328369140625, 3.1803348064422607, 4.080136775970459, 4.979938507080078, 5.8797407150268555, 6.779542922973633, 7.679344654083252, 8.579146385192871, 9.478948593139648, 10.378750801086426, 11.278553009033203, 12.178354263305664, 13.078156471252441, 13.977958679199219, 14.87775993347168, 15.777562141418457, 16.677364349365234, 17.577165603637695, 18.47696876525879, 19.37677001953125, 20.276573181152344, 21.176374435424805, 22.076175689697266, 22.97597885131836, 23.87578010559082, 24.77558135986328, 25.675384521484375, 26.575185775756836, 27.474987030029297, 28.37479019165039, 29.27459144592285, 30.174392700195312, 31.074195861816406]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 9.0, 15.0, 17.0, 9.0, 11.0, 14.0, 21.0, 17.0, 32.0, 21.0, 32.0, 28.0, 18.0, 40.0, 40.0, 38.0, 36.0, 39.0, 32.0, 32.0, 41.0, 33.0, 38.0, 41.0, 37.0, 32.0, 27.0, 32.0, 26.0, 28.0, 21.0, 17.0, 17.0, 13.0, 17.0, 12.0, 9.0, 7.0, 8.0, 11.0, 4.0, 8.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.234375, -6.03515625, -5.8359375, -5.63671875, -5.4375, -5.23828125, -5.0390625, -4.83984375, -4.640625, -4.44140625, -4.2421875, -4.04296875, -3.84375, -3.64453125, -3.4453125, -3.24609375, -3.046875, -2.84765625, -2.6484375, -2.44921875, -2.25, -2.05078125, -1.8515625, -1.65234375, -1.453125, -1.25390625, -1.0546875, -0.85546875, -0.65625, -0.45703125, -0.2578125, -0.05859375, 0.140625, 0.33984375, 0.5390625, 0.73828125, 0.9375, 1.13671875, 1.3359375, 1.53515625, 1.734375, 1.93359375, 2.1328125, 2.33203125, 2.53125, 2.73046875, 2.9296875, 3.12890625, 3.328125, 3.52734375, 3.7265625, 3.92578125, 4.125, 4.32421875, 4.5234375, 4.72265625, 4.921875, 5.12109375, 5.3203125, 5.51953125, 5.71875, 5.91796875, 6.1171875, 6.31640625, 6.515625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 9.0, 15.0, 25.0, 29.0, 33.0, 70.0, 97.0, 161.0, 222.0, 325.0, 479.0, 764.0, 1124.0, 1699.0, 2473.0, 3792.0, 5855.0, 8868.0, 13828.0, 21026.0, 33838.0, 55115.0, 91566.0, 150865.0, 209461.0, 170818.0, 105179.0, 63770.0, 38976.0, 23965.0, 15091.0, 9728.0, 6466.0, 4293.0, 2856.0, 1822.0, 1255.0, 837.0, 574.0, 400.0, 256.0, 180.0, 131.0, 78.0, 45.0, 34.0, 26.0, 14.0, 5.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8173828125, -0.7907028198242188, -0.7640228271484375, -0.7373428344726562, -0.710662841796875, -0.6839828491210938, -0.6573028564453125, -0.6306228637695312, -0.60394287109375, -0.5772628784179688, -0.5505828857421875, -0.5239028930664062, -0.497222900390625, -0.47054290771484375, -0.4438629150390625, -0.41718292236328125, -0.3905029296875, -0.36382293701171875, -0.3371429443359375, -0.31046295166015625, -0.283782958984375, -0.25710296630859375, -0.2304229736328125, -0.20374298095703125, -0.17706298828125, -0.15038299560546875, -0.1237030029296875, -0.09702301025390625, -0.070343017578125, -0.04366302490234375, -0.0169830322265625, 0.00969696044921875, 0.036376953125, 0.06305694580078125, 0.0897369384765625, 0.11641693115234375, 0.143096923828125, 0.16977691650390625, 0.1964569091796875, 0.22313690185546875, 0.24981689453125, 0.27649688720703125, 0.3031768798828125, 0.32985687255859375, 0.356536865234375, 0.38321685791015625, 0.4098968505859375, 0.43657684326171875, 0.4632568359375, 0.48993682861328125, 0.5166168212890625, 0.5432968139648438, 0.569976806640625, 0.5966567993164062, 0.6233367919921875, 0.6500167846679688, 0.67669677734375, 0.7033767700195312, 0.7300567626953125, 0.7567367553710938, 0.783416748046875, 0.8100967407226562, 0.8367767333984375, 0.8634567260742188, 0.89013671875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 6.0, 6.0, 6.0, 6.0, 4.0, 5.0, 11.0, 15.0, 11.0, 11.0, 23.0, 16.0, 26.0, 14.0, 28.0, 32.0, 23.0, 28.0, 37.0, 24.0, 34.0, 38.0, 41.0, 35.0, 1056.0, 37.0, 44.0, 46.0, 36.0, 26.0, 32.0, 20.0, 23.0, 30.0, 17.0, 30.0, 25.0, 17.0, 18.0, 14.0, 15.0, 12.0, 9.0, 3.0, 7.0, 7.0, 5.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-3.947265625, -3.82916259765625, -3.7110595703125, -3.59295654296875, -3.474853515625, -3.35675048828125, -3.2386474609375, -3.12054443359375, -3.00244140625, -2.88433837890625, -2.7662353515625, -2.64813232421875, -2.530029296875, -2.41192626953125, -2.2938232421875, -2.17572021484375, -2.0576171875, -1.93951416015625, -1.8214111328125, -1.70330810546875, -1.585205078125, -1.46710205078125, -1.3489990234375, -1.23089599609375, -1.11279296875, -0.99468994140625, -0.8765869140625, -0.75848388671875, -0.640380859375, -0.52227783203125, -0.4041748046875, -0.28607177734375, -0.16796875, -0.04986572265625, 0.0682373046875, 0.18634033203125, 0.304443359375, 0.42254638671875, 0.5406494140625, 0.65875244140625, 0.77685546875, 0.89495849609375, 1.0130615234375, 1.13116455078125, 1.249267578125, 1.36737060546875, 1.4854736328125, 1.60357666015625, 1.7216796875, 1.83978271484375, 1.9578857421875, 2.07598876953125, 2.194091796875, 2.31219482421875, 2.4302978515625, 2.54840087890625, 2.66650390625, 2.78460693359375, 2.9027099609375, 3.02081298828125, 3.138916015625, 3.25701904296875, 3.3751220703125, 3.49322509765625, 3.611328125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 9.0, 6.0, 9.0, 13.0, 23.0, 30.0, 51.0, 66.0, 124.0, 198.0, 330.0, 490.0, 734.0, 1227.0, 1997.0, 3299.0, 5399.0, 8884.0, 14799.0, 25152.0, 42918.0, 74204.0, 129930.0, 240808.0, 1223232.0, 134986.0, 77447.0, 45035.0, 26078.0, 15774.0, 9265.0, 5676.0, 3469.0, 2022.0, 1263.0, 800.0, 528.0, 295.0, 184.0, 141.0, 86.0, 51.0, 45.0, 18.0, 13.0, 9.0, 3.0, 7.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.810546875, -0.7867355346679688, -0.7629241943359375, -0.7391128540039062, -0.715301513671875, -0.6914901733398438, -0.6676788330078125, -0.6438674926757812, -0.62005615234375, -0.5962448120117188, -0.5724334716796875, -0.5486221313476562, -0.524810791015625, -0.5009994506835938, -0.4771881103515625, -0.45337677001953125, -0.4295654296875, -0.40575408935546875, -0.3819427490234375, -0.35813140869140625, -0.334320068359375, -0.31050872802734375, -0.2866973876953125, -0.26288604736328125, -0.23907470703125, -0.21526336669921875, -0.1914520263671875, -0.16764068603515625, -0.143829345703125, -0.12001800537109375, -0.0962066650390625, -0.07239532470703125, -0.048583984375, -0.02477264404296875, -0.0009613037109375, 0.02285003662109375, 0.046661376953125, 0.07047271728515625, 0.0942840576171875, 0.11809539794921875, 0.14190673828125, 0.16571807861328125, 0.1895294189453125, 0.21334075927734375, 0.237152099609375, 0.26096343994140625, 0.2847747802734375, 0.30858612060546875, 0.3323974609375, 0.35620880126953125, 0.3800201416015625, 0.40383148193359375, 0.427642822265625, 0.45145416259765625, 0.4752655029296875, 0.49907684326171875, 0.52288818359375, 0.5466995239257812, 0.5705108642578125, 0.5943222045898438, 0.618133544921875, 0.6419448852539062, 0.6657562255859375, 0.6895675659179688, 0.71337890625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 10.0, 12.0, 19.0, 18.0, 23.0, 42.0, 55.0, 56.0, 53.0, 67.0, 72.0, 85.0, 68.0, 74.0, 53.0, 62.0, 45.0, 33.0, 37.0, 20.0, 17.0, 14.0, 20.0, 7.0, 2.0, 6.0, 7.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028076171875, -0.002715975046157837, -0.002624332904815674, -0.0025326907634735107, -0.0024410486221313477, -0.0023494064807891846, -0.0022577643394470215, -0.0021661221981048584, -0.0020744800567626953, -0.0019828379154205322, -0.0018911957740783691, -0.001799553632736206, -0.001707911491394043, -0.0016162693500518799, -0.0015246272087097168, -0.0014329850673675537, -0.0013413429260253906, -0.0012497007846832275, -0.0011580586433410645, -0.0010664165019989014, -0.0009747743606567383, -0.0008831322193145752, -0.0007914900779724121, -0.000699847936630249, -0.0006082057952880859, -0.0005165636539459229, -0.00042492151260375977, -0.0003332793712615967, -0.0002416372299194336, -0.0001499950885772705, -5.835294723510742e-05, 3.3289194107055664e-05, 0.00012493133544921875, 0.00021657347679138184, 0.0003082156181335449, 0.000399857759475708, 0.0004914999008178711, 0.0005831420421600342, 0.0006747841835021973, 0.0007664263248443604, 0.0008580684661865234, 0.0009497106075286865, 0.0010413527488708496, 0.0011329948902130127, 0.0012246370315551758, 0.0013162791728973389, 0.001407921314239502, 0.001499563455581665, 0.0015912055969238281, 0.0016828477382659912, 0.0017744898796081543, 0.0018661320209503174, 0.0019577741622924805, 0.0020494163036346436, 0.0021410584449768066, 0.0022327005863189697, 0.002324342727661133, 0.002415984869003296, 0.002507627010345459, 0.002599269151687622, 0.002690911293029785, 0.0027825534343719482, 0.0028741955757141113, 0.0029658377170562744, 0.0030574798583984375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 6.0, 8.0, 9.0, 11.0, 20.0, 24.0, 27.0, 54.0, 52.0, 66.0, 92.0, 141.0, 222.0, 425.0, 1038.0, 203211.0, 840326.0, 1555.0, 460.0, 262.0, 165.0, 83.0, 86.0, 65.0, 38.0, 17.0, 24.0, 10.0, 13.0, 8.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06024169921875, -0.05842161178588867, -0.056601524353027344, -0.054781436920166016, -0.05296134948730469, -0.05114126205444336, -0.04932117462158203, -0.0475010871887207, -0.045680999755859375, -0.04386091232299805, -0.04204082489013672, -0.04022073745727539, -0.03840065002441406, -0.036580562591552734, -0.034760475158691406, -0.03294038772583008, -0.03112030029296875, -0.029300212860107422, -0.027480125427246094, -0.025660037994384766, -0.023839950561523438, -0.02201986312866211, -0.02019977569580078, -0.018379688262939453, -0.016559600830078125, -0.014739513397216797, -0.012919425964355469, -0.01109933853149414, -0.009279251098632812, -0.007459163665771484, -0.005639076232910156, -0.003818988800048828, -0.0019989013671875, -0.00017881393432617188, 0.0016412734985351562, 0.0034613609313964844, 0.0052814483642578125, 0.007101535797119141, 0.008921623229980469, 0.010741710662841797, 0.012561798095703125, 0.014381885528564453, 0.01620197296142578, 0.01802206039428711, 0.019842147827148438, 0.021662235260009766, 0.023482322692871094, 0.025302410125732422, 0.02712249755859375, 0.028942584991455078, 0.030762672424316406, 0.032582759857177734, 0.03440284729003906, 0.03622293472290039, 0.03804302215576172, 0.03986310958862305, 0.041683197021484375, 0.0435032844543457, 0.04532337188720703, 0.04714345932006836, 0.04896354675292969, 0.050783634185791016, 0.052603721618652344, 0.05442380905151367, 0.056243896484375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 11.0, 36.0, 120.0, 277.0, 344.0, 165.0, 44.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007026367820799351, -0.0005662731127813458, -0.00042990950169041753, -0.00029354586149565876, -0.00015718222130089998, -2.0818552002310753e-05, 0.00011554505908861756, 0.0002519086701795459, 0.0003882723394781351, 0.0005246360087767243, 0.0006609996198676527, 0.000797363230958581, 0.0009337269002571702, 0.0010700905695557594, 0.0012064541224390268, 0.001342817791737616, 0.0014791814610362053, 0.0016155451303347945, 0.0017519087996333838, 0.0018882723525166512, 0.002024636138230562, 0.0021609996911138296, 0.002297363243997097, 0.002433727029711008, 0.0025700905825942755, 0.002706454135477543, 0.002842817921191454, 0.0029791814740747213, 0.0031155450269579887, 0.0032519088126719, 0.003388272365555167, 0.0035246359184384346, 0.0036609992384910583, 0.0037973627913743258, 0.003933726344257593, 0.004070090129971504, 0.004206453915685415, 0.004342817701399326, 0.00447918102145195, 0.004615544807165861, 0.004751908592879772, 0.004888272378593683, 0.005024635698646307, 0.005160999484360218, 0.005297363270074129, 0.00543372705578804, 0.005570090375840664, 0.005706454161554575, 0.005842817481607199, 0.00597918126732111, 0.0061155445873737335, 0.006251908373087645, 0.006388272158801556, 0.006524635478854179, 0.0066609992645680904, 0.0067973630502820015, 0.006933726370334625, 0.007070090156048536, 0.00720645347610116, 0.007342817261815071, 0.007479181047528982, 0.007615544833242893, 0.007751908153295517, 0.00788827147334814, 0.008024635724723339]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 3.0, 8.0, 11.0, 9.0, 19.0, 14.0, 12.0, 10.0, 18.0, 14.0, 25.0, 15.0, 29.0, 27.0, 43.0, 29.0, 30.0, 38.0, 39.0, 43.0, 44.0, 40.0, 43.0, 47.0, 32.0, 33.0, 37.0, 40.0, 27.0, 22.0, 33.0, 23.0, 22.0, 15.0, 26.0, 15.0, 14.0, 11.0, 7.0, 9.0, 8.0, 4.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013598799705505371, -0.0013212459161877632, -0.0012826118618249893, -0.0012439778074622154, -0.0012053437530994415, -0.0011667096987366676, -0.0011280756443738937, -0.0010894415900111198, -0.001050807535648346, -0.001012173481285572, -0.0009735394269227982, -0.0009349053725600243, -0.0008962713181972504, -0.0008576372638344765, -0.0008190032094717026, -0.0007803691551089287, -0.0007417351007461548, -0.0007031010463833809, -0.000664466992020607, -0.0006258329376578331, -0.0005871988832950592, -0.0005485648289322853, -0.0005099307745695114, -0.0004712967202067375, -0.0004326626658439636, -0.00039402861148118973, -0.00035539455711841583, -0.00031676050275564194, -0.00027812644839286804, -0.00023949239403009415, -0.00020085833966732025, -0.00016222428530454636, -0.00012359023094177246, -8.495617657899857e-05, -4.632212221622467e-05, -7.688067853450775e-06, 3.094598650932312e-05, 6.958004087209702e-05, 0.00010821409523487091, 0.0001468481495976448, 0.0001854822039604187, 0.0002241162583231926, 0.0002627503126859665, 0.0003013843670487404, 0.0003400184214115143, 0.0003786524757742882, 0.00041728653013706207, 0.00045592058449983597, 0.0004945546388626099, 0.0005331886932253838, 0.0005718227475881577, 0.0006104568019509315, 0.0006490908563137054, 0.0006877249106764793, 0.0007263589650392532, 0.0007649930194020271, 0.000803627073764801, 0.0008422611281275749, 0.0008808951824903488, 0.0009195292368531227, 0.0009581632912158966, 0.0009967973455786705, 0.0010354313999414444, 0.0010740654543042183, 0.0011126995086669922]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 9.0, 15.0, 17.0, 9.0, 11.0, 14.0, 21.0, 17.0, 32.0, 21.0, 32.0, 28.0, 18.0, 40.0, 40.0, 38.0, 36.0, 39.0, 32.0, 32.0, 41.0, 33.0, 38.0, 41.0, 37.0, 32.0, 27.0, 32.0, 26.0, 28.0, 21.0, 17.0, 17.0, 13.0, 17.0, 12.0, 9.0, 7.0, 8.0, 11.0, 4.0, 8.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.234375, -6.03515625, -5.8359375, -5.63671875, -5.4375, -5.23828125, -5.0390625, -4.83984375, -4.640625, -4.44140625, -4.2421875, -4.04296875, -3.84375, -3.64453125, -3.4453125, -3.24609375, -3.046875, -2.84765625, -2.6484375, -2.44921875, -2.25, -2.05078125, -1.8515625, -1.65234375, -1.453125, -1.25390625, -1.0546875, -0.85546875, -0.65625, -0.45703125, -0.2578125, -0.05859375, 0.140625, 0.33984375, 0.5390625, 0.73828125, 0.9375, 1.13671875, 1.3359375, 1.53515625, 1.734375, 1.93359375, 2.1328125, 2.33203125, 2.53125, 2.73046875, 2.9296875, 3.12890625, 3.328125, 3.52734375, 3.7265625, 3.92578125, 4.125, 4.32421875, 4.5234375, 4.72265625, 4.921875, 5.12109375, 5.3203125, 5.51953125, 5.71875, 5.91796875, 6.1171875, 6.31640625, 6.515625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 13.0, 14.0, 13.0, 34.0, 34.0, 49.0, 70.0, 102.0, 101.0, 172.0, 240.0, 344.0, 457.0, 665.0, 1062.0, 1912.0, 3571.0, 7290.0, 17513.0, 46002.0, 136100.0, 388499.0, 290937.0, 94208.0, 33127.0, 12872.0, 5707.0, 2863.0, 1537.0, 946.0, 615.0, 413.0, 288.0, 232.0, 144.0, 112.0, 99.0, 55.0, 41.0, 31.0, 19.0, 20.0, 11.0, 7.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.9921875, -7.748779296875, -7.50537109375, -7.261962890625, -7.0185546875, -6.775146484375, -6.53173828125, -6.288330078125, -6.044921875, -5.801513671875, -5.55810546875, -5.314697265625, -5.0712890625, -4.827880859375, -4.58447265625, -4.341064453125, -4.09765625, -3.854248046875, -3.61083984375, -3.367431640625, -3.1240234375, -2.880615234375, -2.63720703125, -2.393798828125, -2.150390625, -1.906982421875, -1.66357421875, -1.420166015625, -1.1767578125, -0.933349609375, -0.68994140625, -0.446533203125, -0.203125, 0.040283203125, 0.28369140625, 0.527099609375, 0.7705078125, 1.013916015625, 1.25732421875, 1.500732421875, 1.744140625, 1.987548828125, 2.23095703125, 2.474365234375, 2.7177734375, 2.961181640625, 3.20458984375, 3.447998046875, 3.69140625, 3.934814453125, 4.17822265625, 4.421630859375, 4.6650390625, 4.908447265625, 5.15185546875, 5.395263671875, 5.638671875, 5.882080078125, 6.12548828125, 6.368896484375, 6.6123046875, 6.855712890625, 7.09912109375, 7.342529296875, 7.5859375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 3.0, 6.0, 1.0, 3.0, 7.0, 12.0, 11.0, 16.0, 12.0, 18.0, 13.0, 23.0, 18.0, 27.0, 34.0, 30.0, 36.0, 58.0, 71.0, 77.0, 152.0, 1402.0, 370.0, 155.0, 91.0, 62.0, 41.0, 61.0, 28.0, 34.0, 31.0, 32.0, 22.0, 15.0, 18.0, 8.0, 9.0, 9.0, 9.0, 4.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-18.421875, -17.879638671875, -17.33740234375, -16.795166015625, -16.2529296875, -15.710693359375, -15.16845703125, -14.626220703125, -14.083984375, -13.541748046875, -12.99951171875, -12.457275390625, -11.9150390625, -11.372802734375, -10.83056640625, -10.288330078125, -9.74609375, -9.203857421875, -8.66162109375, -8.119384765625, -7.5771484375, -7.034912109375, -6.49267578125, -5.950439453125, -5.408203125, -4.865966796875, -4.32373046875, -3.781494140625, -3.2392578125, -2.697021484375, -2.15478515625, -1.612548828125, -1.0703125, -0.528076171875, 0.01416015625, 0.556396484375, 1.0986328125, 1.640869140625, 2.18310546875, 2.725341796875, 3.267578125, 3.809814453125, 4.35205078125, 4.894287109375, 5.4365234375, 5.978759765625, 6.52099609375, 7.063232421875, 7.60546875, 8.147705078125, 8.68994140625, 9.232177734375, 9.7744140625, 10.316650390625, 10.85888671875, 11.401123046875, 11.943359375, 12.485595703125, 13.02783203125, 13.570068359375, 14.1123046875, 14.654541015625, 15.19677734375, 15.739013671875, 16.28125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 4.0, 9.0, 6.0, 16.0, 17.0, 16.0, 23.0, 27.0, 32.0, 40.0, 41.0, 78.0, 118.0, 164.0, 222.0, 372.0, 667.0, 2887.0, 50415.0, 2964031.0, 119874.0, 4577.0, 837.0, 373.0, 234.0, 149.0, 118.0, 82.0, 64.0, 56.0, 33.0, 24.0, 31.0, 16.0, 9.0, 6.0, 9.0, 7.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.125, -26.1767578125, -25.228515625, -24.2802734375, -23.33203125, -22.3837890625, -21.435546875, -20.4873046875, -19.5390625, -18.5908203125, -17.642578125, -16.6943359375, -15.74609375, -14.7978515625, -13.849609375, -12.9013671875, -11.953125, -11.0048828125, -10.056640625, -9.1083984375, -8.16015625, -7.2119140625, -6.263671875, -5.3154296875, -4.3671875, -3.4189453125, -2.470703125, -1.5224609375, -0.57421875, 0.3740234375, 1.322265625, 2.2705078125, 3.21875, 4.1669921875, 5.115234375, 6.0634765625, 7.01171875, 7.9599609375, 8.908203125, 9.8564453125, 10.8046875, 11.7529296875, 12.701171875, 13.6494140625, 14.59765625, 15.5458984375, 16.494140625, 17.4423828125, 18.390625, 19.3388671875, 20.287109375, 21.2353515625, 22.18359375, 23.1318359375, 24.080078125, 25.0283203125, 25.9765625, 26.9248046875, 27.873046875, 28.8212890625, 29.76953125, 30.7177734375, 31.666015625, 32.6142578125, 33.5625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.0, 832.0, 128.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.935203552246094, -56.08351135253906, -50.23181915283203, -44.380123138427734, -38.5284309387207, -32.67673873901367, -26.825042724609375, -20.973350524902344, -15.121658325195312, -9.269965171813965, -3.418272018432617, 2.433422088623047, 8.285114288330078, 14.13680648803711, 19.988502502441406, 25.840194702148438, 31.69188690185547, 37.5435791015625, 43.39527130126953, 49.24696731567383, 55.09865951538086, 60.95035171508789, 66.80204772949219, 72.65373992919922, 78.50543212890625, 84.35712432861328, 90.20881652832031, 96.06051635742188, 101.91220092773438, 107.76390075683594, 113.61559295654297, 119.46728515625, 125.3189697265625, 131.17066955566406, 137.02235412597656, 142.87405395507812, 148.72573852539062, 154.5774383544922, 160.42913818359375, 166.28082275390625, 172.13250732421875, 177.9842071533203, 183.8358917236328, 189.68759155273438, 195.53927612304688, 201.39097595214844, 207.24267578125, 213.0943603515625, 218.94606018066406, 224.79776000976562, 230.64944458007812, 236.5011444091797, 242.3528289794922, 248.20452880859375, 254.05621337890625, 259.90789794921875, 265.7596130371094, 271.6112976074219, 277.4630126953125, 283.314697265625, 289.1663818359375, 295.01806640625, 300.8697814941406, 306.7214660644531, 312.5731506347656]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 3.0, 9.0, 10.0, 15.0, 12.0, 7.0, 16.0, 20.0, 25.0, 22.0, 36.0, 33.0, 23.0, 35.0, 41.0, 49.0, 32.0, 47.0, 36.0, 46.0, 54.0, 33.0, 34.0, 36.0, 30.0, 30.0, 36.0, 32.0, 26.0, 25.0, 29.0, 26.0, 27.0, 12.0, 12.0, 7.0, 7.0, 3.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.90922546386719, -37.681705474853516, -36.45418930053711, -35.22666931152344, -33.99915313720703, -32.77163314819336, -31.544113159179688, -30.31659507751465, -29.08907699584961, -27.86155891418457, -26.63404083251953, -25.40652084350586, -24.17900276184082, -22.95148468017578, -21.72396469116211, -20.49644660949707, -19.26892852783203, -18.041410446166992, -16.813892364501953, -15.586372375488281, -14.358854293823242, -13.131336212158203, -11.903817176818848, -10.676298141479492, -9.448780059814453, -8.221261978149414, -6.993742942810059, -5.766224384307861, -4.538705825805664, -3.311187267303467, -2.0836687088012695, -0.8561496734619141, 0.3713645935058594, 1.5988831520080566, 2.826401710510254, 4.053920269012451, 5.281438827514648, 6.508957386016846, 7.736475944519043, 8.963994979858398, 10.191513061523438, 11.419031143188477, 12.646550178527832, 13.874069213867188, 15.101587295532227, 16.329105377197266, 17.556625366210938, 18.784143447875977, 20.011661529541016, 21.239179611206055, 22.466697692871094, 23.694217681884766, 24.921735763549805, 26.149253845214844, 27.376773834228516, 28.604291915893555, 29.831809997558594, 31.059328079223633, 32.28684616088867, 33.514366149902344, 34.74188232421875, 35.96940231323242, 37.196922302246094, 38.4244384765625, 39.65195846557617]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 6.0, 3.0, 12.0, 15.0, 12.0, 9.0, 13.0, 25.0, 23.0, 26.0, 36.0, 22.0, 33.0, 37.0, 33.0, 46.0, 46.0, 42.0, 40.0, 37.0, 40.0, 39.0, 35.0, 47.0, 49.0, 29.0, 35.0, 30.0, 29.0, 16.0, 26.0, 16.0, 17.0, 17.0, 11.0, 15.0, 11.0, 10.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.64453125, -6.42071533203125, -6.1968994140625, -5.97308349609375, -5.749267578125, -5.52545166015625, -5.3016357421875, -5.07781982421875, -4.85400390625, -4.63018798828125, -4.4063720703125, -4.18255615234375, -3.958740234375, -3.73492431640625, -3.5111083984375, -3.28729248046875, -3.0634765625, -2.83966064453125, -2.6158447265625, -2.39202880859375, -2.168212890625, -1.94439697265625, -1.7205810546875, -1.49676513671875, -1.27294921875, -1.04913330078125, -0.8253173828125, -0.60150146484375, -0.377685546875, -0.15386962890625, 0.0699462890625, 0.29376220703125, 0.517578125, 0.74139404296875, 0.9652099609375, 1.18902587890625, 1.412841796875, 1.63665771484375, 1.8604736328125, 2.08428955078125, 2.30810546875, 2.53192138671875, 2.7557373046875, 2.97955322265625, 3.203369140625, 3.42718505859375, 3.6510009765625, 3.87481689453125, 4.0986328125, 4.32244873046875, 4.5462646484375, 4.77008056640625, 4.993896484375, 5.21771240234375, 5.4415283203125, 5.66534423828125, 5.88916015625, 6.11297607421875, 6.3367919921875, 6.56060791015625, 6.784423828125, 7.00823974609375, 7.2320556640625, 7.45587158203125, 7.6796875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 11.0, 4.0, 11.0, 14.0, 19.0, 11.0, 28.0, 39.0, 44.0, 59.0, 67.0, 105.0, 131.0, 219.0, 278.0, 395.0, 477.0, 3671.0, 4185128.0, 1776.0, 468.0, 335.0, 261.0, 192.0, 135.0, 93.0, 77.0, 47.0, 34.0, 31.0, 27.0, 26.0, 22.0, 10.0, 7.0, 9.0, 4.0, 9.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.375, -146.23046875, -141.0859375, -135.94140625, -130.796875, -125.65234375, -120.5078125, -115.36328125, -110.21875, -105.07421875, -99.9296875, -94.78515625, -89.640625, -84.49609375, -79.3515625, -74.20703125, -69.0625, -63.91796875, -58.7734375, -53.62890625, -48.484375, -43.33984375, -38.1953125, -33.05078125, -27.90625, -22.76171875, -17.6171875, -12.47265625, -7.328125, -2.18359375, 2.9609375, 8.10546875, 13.25, 18.39453125, 23.5390625, 28.68359375, 33.828125, 38.97265625, 44.1171875, 49.26171875, 54.40625, 59.55078125, 64.6953125, 69.83984375, 74.984375, 80.12890625, 85.2734375, 90.41796875, 95.5625, 100.70703125, 105.8515625, 110.99609375, 116.140625, 121.28515625, 126.4296875, 131.57421875, 136.71875, 141.86328125, 147.0078125, 152.15234375, 157.296875, 162.44140625, 167.5859375, 172.73046875, 177.875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 17.0, 14.0, 25.0, 49.0, 83.0, 121.0, 270.0, 508.0, 1006.0, 1008.0, 459.0, 226.0, 110.0, 61.0, 37.0, 33.0, 11.0, 10.0, 6.0, 3.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.046875, -14.418212890625, -13.78955078125, -13.160888671875, -12.5322265625, -11.903564453125, -11.27490234375, -10.646240234375, -10.017578125, -9.388916015625, -8.76025390625, -8.131591796875, -7.5029296875, -6.874267578125, -6.24560546875, -5.616943359375, -4.98828125, -4.359619140625, -3.73095703125, -3.102294921875, -2.4736328125, -1.844970703125, -1.21630859375, -0.587646484375, 0.041015625, 0.669677734375, 1.29833984375, 1.927001953125, 2.5556640625, 3.184326171875, 3.81298828125, 4.441650390625, 5.0703125, 5.698974609375, 6.32763671875, 6.956298828125, 7.5849609375, 8.213623046875, 8.84228515625, 9.470947265625, 10.099609375, 10.728271484375, 11.35693359375, 11.985595703125, 12.6142578125, 13.242919921875, 13.87158203125, 14.500244140625, 15.12890625, 15.757568359375, 16.38623046875, 17.014892578125, 17.6435546875, 18.272216796875, 18.90087890625, 19.529541015625, 20.158203125, 20.786865234375, 21.41552734375, 22.044189453125, 22.6728515625, 23.301513671875, 23.93017578125, 24.558837890625, 25.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 17.0, 19.0, 21.0, 14.0, 31.0, 37.0, 65.0, 83.0, 117.0, 479.0, 99437.0, 4092251.0, 1212.0, 172.0, 92.0, 52.0, 48.0, 36.0, 25.0, 17.0, 19.0, 16.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.0, -140.32421875, -136.6484375, -132.97265625, -129.296875, -125.62109375, -121.9453125, -118.26953125, -114.59375, -110.91796875, -107.2421875, -103.56640625, -99.890625, -96.21484375, -92.5390625, -88.86328125, -85.1875, -81.51171875, -77.8359375, -74.16015625, -70.484375, -66.80859375, -63.1328125, -59.45703125, -55.78125, -52.10546875, -48.4296875, -44.75390625, -41.078125, -37.40234375, -33.7265625, -30.05078125, -26.375, -22.69921875, -19.0234375, -15.34765625, -11.671875, -7.99609375, -4.3203125, -0.64453125, 3.03125, 6.70703125, 10.3828125, 14.05859375, 17.734375, 21.41015625, 25.0859375, 28.76171875, 32.4375, 36.11328125, 39.7890625, 43.46484375, 47.140625, 50.81640625, 54.4921875, 58.16796875, 61.84375, 65.51953125, 69.1953125, 72.87109375, 76.546875, 80.22265625, 83.8984375, 87.57421875, 91.25]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 44.0, 430.0, 460.0, 75.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.61212158203125, -81.81055450439453, -76.00898742675781, -70.20741271972656, -64.40585327148438, -58.60428237915039, -52.802711486816406, -47.00114440917969, -41.19957733154297, -35.39801025390625, -29.5964412689209, -23.794872283935547, -17.993305206298828, -12.19173812866211, -6.390167236328125, -0.5886001586914062, 5.2129669189453125, 11.014534950256348, 16.816102981567383, 22.617671966552734, 28.419239044189453, 34.22080612182617, 40.022377014160156, 45.823944091796875, 51.625511169433594, 57.42707824707031, 63.22864532470703, 69.03021240234375, 74.831787109375, 80.63334655761719, 86.43492126464844, 92.23648834228516, 98.03805541992188, 103.8396224975586, 109.64118957519531, 115.44276428222656, 121.24432373046875, 127.0458984375, 132.84747314453125, 138.64903259277344, 144.45059204101562, 150.25216674804688, 156.05372619628906, 161.8553009033203, 167.6568603515625, 173.45843505859375, 179.260009765625, 185.0615692138672, 190.86314392089844, 196.6647186279297, 202.46627807617188, 208.26785278320312, 214.0694122314453, 219.87098693847656, 225.67254638671875, 231.47412109375, 237.27569580078125, 243.0772705078125, 248.8788299560547, 254.68040466308594, 260.4819641113281, 266.2835388183594, 272.0851135253906, 277.88665771484375, 283.688232421875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 10.0, 14.0, 15.0, 18.0, 18.0, 21.0, 27.0, 24.0, 21.0, 33.0, 32.0, 46.0, 49.0, 36.0, 44.0, 51.0, 34.0, 49.0, 55.0, 44.0, 43.0, 29.0, 29.0, 32.0, 32.0, 30.0, 21.0, 24.0, 15.0, 19.0, 14.0, 19.0, 6.0, 6.0, 8.0, 6.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.53916931152344, -41.313228607177734, -40.08728790283203, -38.861351013183594, -37.63541030883789, -36.40946960449219, -35.183528900146484, -33.95758819580078, -32.731651306152344, -31.50571060180664, -30.27977180480957, -29.053831100463867, -27.827892303466797, -26.601951599121094, -25.37601089477539, -24.15007209777832, -22.924131393432617, -21.698190689086914, -20.472251892089844, -19.24631118774414, -18.02037239074707, -16.794431686401367, -15.56849193572998, -14.342552185058594, -13.116612434387207, -11.89067268371582, -10.664732933044434, -9.438793182373047, -8.212852478027344, -6.986913204193115, -5.76097297668457, -4.535033226013184, -3.309093475341797, -2.08315372467041, -0.8572137355804443, 0.3687262535095215, 1.5946660041809082, 2.820605754852295, 4.04654598236084, 5.272485733032227, 6.498425483703613, 7.724365234375, 8.950304985046387, 10.176244735717773, 11.402185440063477, 12.628124237060547, 13.85406494140625, 15.080004692077637, 16.305944442749023, 17.531885147094727, 18.757823944091797, 19.9837646484375, 21.20970344543457, 22.435644149780273, 23.661582946777344, 24.887523651123047, 26.11346435546875, 27.339405059814453, 28.565343856811523, 29.791284561157227, 31.017223358154297, 32.2431640625, 33.4691047668457, 34.695045471191406, 35.920982360839844]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 7.0, 7.0, 8.0, 9.0, 14.0, 20.0, 26.0, 22.0, 23.0, 32.0, 33.0, 30.0, 28.0, 34.0, 37.0, 36.0, 48.0, 55.0, 43.0, 45.0, 41.0, 24.0, 32.0, 41.0, 38.0, 30.0, 22.0, 33.0, 27.0, 29.0, 24.0, 22.0, 17.0, 19.0, 9.0, 3.0, 2.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.51171875, -6.2928466796875, -6.073974609375, -5.8551025390625, -5.63623046875, -5.4173583984375, -5.198486328125, -4.9796142578125, -4.7607421875, -4.5418701171875, -4.322998046875, -4.1041259765625, -3.88525390625, -3.6663818359375, -3.447509765625, -3.2286376953125, -3.009765625, -2.7908935546875, -2.572021484375, -2.3531494140625, -2.13427734375, -1.9154052734375, -1.696533203125, -1.4776611328125, -1.2587890625, -1.0399169921875, -0.821044921875, -0.6021728515625, -0.38330078125, -0.1644287109375, 0.054443359375, 0.2733154296875, 0.4921875, 0.7110595703125, 0.929931640625, 1.1488037109375, 1.36767578125, 1.5865478515625, 1.805419921875, 2.0242919921875, 2.2431640625, 2.4620361328125, 2.680908203125, 2.8997802734375, 3.11865234375, 3.3375244140625, 3.556396484375, 3.7752685546875, 3.994140625, 4.2130126953125, 4.431884765625, 4.6507568359375, 4.86962890625, 5.0885009765625, 5.307373046875, 5.5262451171875, 5.7451171875, 5.9639892578125, 6.182861328125, 6.4017333984375, 6.62060546875, 6.8394775390625, 7.058349609375, 7.2772216796875, 7.49609375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 16.0, 9.0, 12.0, 20.0, 50.0, 58.0, 91.0, 170.0, 246.0, 338.0, 492.0, 718.0, 1007.0, 1479.0, 2085.0, 2942.0, 4389.0, 6360.0, 9391.0, 13893.0, 20580.0, 31233.0, 48640.0, 80304.0, 138135.0, 213606.0, 182488.0, 107490.0, 63208.0, 39778.0, 25661.0, 17148.0, 11458.0, 7689.0, 5388.0, 3657.0, 2525.0, 1803.0, 1278.0, 859.0, 628.0, 435.0, 295.0, 176.0, 126.0, 65.0, 49.0, 27.0, 15.0, 13.0, 8.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.84326171875, -0.8167190551757812, -0.7901763916015625, -0.7636337280273438, -0.737091064453125, -0.7105484008789062, -0.6840057373046875, -0.6574630737304688, -0.63092041015625, -0.6043777465820312, -0.5778350830078125, -0.5512924194335938, -0.524749755859375, -0.49820709228515625, -0.4716644287109375, -0.44512176513671875, -0.4185791015625, -0.39203643798828125, -0.3654937744140625, -0.33895111083984375, -0.312408447265625, -0.28586578369140625, -0.2593231201171875, -0.23278045654296875, -0.20623779296875, -0.17969512939453125, -0.1531524658203125, -0.12660980224609375, -0.100067138671875, -0.07352447509765625, -0.0469818115234375, -0.02043914794921875, 0.006103515625, 0.03264617919921875, 0.0591888427734375, 0.08573150634765625, 0.112274169921875, 0.13881683349609375, 0.1653594970703125, 0.19190216064453125, 0.21844482421875, 0.24498748779296875, 0.2715301513671875, 0.29807281494140625, 0.324615478515625, 0.35115814208984375, 0.3777008056640625, 0.40424346923828125, 0.4307861328125, 0.45732879638671875, 0.4838714599609375, 0.5104141235351562, 0.536956787109375, 0.5634994506835938, 0.5900421142578125, 0.6165847778320312, 0.64312744140625, 0.6696701049804688, 0.6962127685546875, 0.7227554321289062, 0.749298095703125, 0.7758407592773438, 0.8023834228515625, 0.8289260864257812, 0.85546875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 10.0, 5.0, 14.0, 11.0, 10.0, 13.0, 14.0, 18.0, 24.0, 19.0, 27.0, 26.0, 35.0, 39.0, 33.0, 40.0, 43.0, 48.0, 38.0, 1062.0, 39.0, 39.0, 38.0, 40.0, 22.0, 34.0, 29.0, 31.0, 27.0, 30.0, 31.0, 25.0, 21.0, 16.0, 10.0, 14.0, 11.0, 14.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.9454345703125, -3.816650390625, -3.6878662109375, -3.55908203125, -3.4302978515625, -3.301513671875, -3.1727294921875, -3.0439453125, -2.9151611328125, -2.786376953125, -2.6575927734375, -2.52880859375, -2.4000244140625, -2.271240234375, -2.1424560546875, -2.013671875, -1.8848876953125, -1.756103515625, -1.6273193359375, -1.49853515625, -1.3697509765625, -1.240966796875, -1.1121826171875, -0.9833984375, -0.8546142578125, -0.725830078125, -0.5970458984375, -0.46826171875, -0.3394775390625, -0.210693359375, -0.0819091796875, 0.046875, 0.1756591796875, 0.304443359375, 0.4332275390625, 0.56201171875, 0.6907958984375, 0.819580078125, 0.9483642578125, 1.0771484375, 1.2059326171875, 1.334716796875, 1.4635009765625, 1.59228515625, 1.7210693359375, 1.849853515625, 1.9786376953125, 2.107421875, 2.2362060546875, 2.364990234375, 2.4937744140625, 2.62255859375, 2.7513427734375, 2.880126953125, 3.0089111328125, 3.1376953125, 3.2664794921875, 3.395263671875, 3.5240478515625, 3.65283203125, 3.7816162109375, 3.910400390625, 4.0391845703125, 4.16796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 13.0, 25.0, 26.0, 54.0, 57.0, 100.0, 167.0, 264.0, 440.0, 700.0, 1215.0, 2009.0, 3298.0, 5706.0, 10047.0, 17603.0, 31345.0, 57347.0, 107622.0, 197239.0, 1295831.0, 166805.0, 89077.0, 48082.0, 26513.0, 14989.0, 8668.0, 4935.0, 2780.0, 1663.0, 992.0, 585.0, 361.0, 193.0, 141.0, 86.0, 49.0, 33.0, 24.0, 13.0, 9.0, 7.0, 6.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73193359375, -0.70611572265625, -0.6802978515625, -0.65447998046875, -0.628662109375, -0.60284423828125, -0.5770263671875, -0.55120849609375, -0.525390625, -0.49957275390625, -0.4737548828125, -0.44793701171875, -0.422119140625, -0.39630126953125, -0.3704833984375, -0.34466552734375, -0.31884765625, -0.29302978515625, -0.2672119140625, -0.24139404296875, -0.215576171875, -0.18975830078125, -0.1639404296875, -0.13812255859375, -0.1123046875, -0.08648681640625, -0.0606689453125, -0.03485107421875, -0.009033203125, 0.01678466796875, 0.0426025390625, 0.06842041015625, 0.09423828125, 0.12005615234375, 0.1458740234375, 0.17169189453125, 0.197509765625, 0.22332763671875, 0.2491455078125, 0.27496337890625, 0.30078125, 0.32659912109375, 0.3524169921875, 0.37823486328125, 0.404052734375, 0.42987060546875, 0.4556884765625, 0.48150634765625, 0.50732421875, 0.53314208984375, 0.5589599609375, 0.58477783203125, 0.610595703125, 0.63641357421875, 0.6622314453125, 0.68804931640625, 0.7138671875, 0.73968505859375, 0.7655029296875, 0.79132080078125, 0.817138671875, 0.84295654296875, 0.8687744140625, 0.89459228515625, 0.92041015625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 6.0, 7.0, 12.0, 8.0, 18.0, 17.0, 29.0, 20.0, 41.0, 44.0, 44.0, 48.0, 61.0, 63.0, 64.0, 63.0, 59.0, 49.0, 53.0, 54.0, 32.0, 44.0, 24.0, 30.0, 18.0, 19.0, 13.0, 14.0, 9.0, 5.0, 8.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00217437744140625, -0.002096414566040039, -0.002018451690673828, -0.0019404888153076172, -0.0018625259399414062, -0.0017845630645751953, -0.0017066001892089844, -0.0016286373138427734, -0.0015506744384765625, -0.0014727115631103516, -0.0013947486877441406, -0.0013167858123779297, -0.0012388229370117188, -0.0011608600616455078, -0.0010828971862792969, -0.001004934310913086, -0.000926971435546875, -0.0008490085601806641, -0.0007710456848144531, -0.0006930828094482422, -0.0006151199340820312, -0.0005371570587158203, -0.0004591941833496094, -0.00038123130798339844, -0.0003032684326171875, -0.00022530555725097656, -0.00014734268188476562, -6.937980651855469e-05, 8.58306884765625e-06, 8.654594421386719e-05, 0.00016450881958007812, 0.00024247169494628906, 0.0003204345703125, 0.00039839744567871094, 0.0004763603210449219, 0.0005543231964111328, 0.0006322860717773438, 0.0007102489471435547, 0.0007882118225097656, 0.0008661746978759766, 0.0009441375732421875, 0.0010221004486083984, 0.0011000633239746094, 0.0011780261993408203, 0.0012559890747070312, 0.0013339519500732422, 0.0014119148254394531, 0.001489877700805664, 0.001567840576171875, 0.001645803451538086, 0.0017237663269042969, 0.0018017292022705078, 0.0018796920776367188, 0.0019576549530029297, 0.0020356178283691406, 0.0021135807037353516, 0.0021915435791015625, 0.0022695064544677734, 0.0023474693298339844, 0.0024254322052001953, 0.0025033950805664062, 0.002581357955932617, 0.002659320831298828, 0.002737283706665039, 0.00281524658203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 10.0, 8.0, 27.0, 21.0, 26.0, 32.0, 46.0, 51.0, 57.0, 94.0, 141.0, 168.0, 249.0, 365.0, 684.0, 2128.0, 859295.0, 182208.0, 1280.0, 562.0, 317.0, 217.0, 134.0, 105.0, 73.0, 57.0, 42.0, 33.0, 20.0, 21.0, 21.0, 10.0, 5.0, 10.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.047515869140625, -0.04615306854248047, -0.04479026794433594, -0.043427467346191406, -0.042064666748046875, -0.040701866149902344, -0.03933906555175781, -0.03797626495361328, -0.03661346435546875, -0.03525066375732422, -0.03388786315917969, -0.032525062561035156, -0.031162261962890625, -0.029799461364746094, -0.028436660766601562, -0.02707386016845703, -0.0257110595703125, -0.02434825897216797, -0.022985458374023438, -0.021622657775878906, -0.020259857177734375, -0.018897056579589844, -0.017534255981445312, -0.01617145538330078, -0.01480865478515625, -0.013445854187011719, -0.012083053588867188, -0.010720252990722656, -0.009357452392578125, -0.007994651794433594, -0.0066318511962890625, -0.005269050598144531, -0.00390625, -0.0025434494018554688, -0.0011806488037109375, 0.00018215179443359375, 0.001544952392578125, 0.0029077529907226562, 0.0042705535888671875, 0.005633354187011719, 0.00699615478515625, 0.008358955383300781, 0.009721755981445312, 0.011084556579589844, 0.012447357177734375, 0.013810157775878906, 0.015172958374023438, 0.01653575897216797, 0.0178985595703125, 0.01926136016845703, 0.020624160766601562, 0.021986961364746094, 0.023349761962890625, 0.024712562561035156, 0.026075363159179688, 0.02743816375732422, 0.02880096435546875, 0.03016376495361328, 0.03152656555175781, 0.032889366149902344, 0.034252166748046875, 0.035614967346191406, 0.03697776794433594, 0.03834056854248047, 0.039703369140625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [56.0, 955.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010350876254960895, -0.0002198097645305097, 0.00059546809643507, 0.0014107458991929889, 0.0022260239347815514, 0.0030413013882935047, 0.0038565793074667454, 0.004671857226639986, 0.005487135145813227, 0.006302413064986467, 0.007117690984159708, 0.007932968437671661, 0.008748246356844902, 0.009563524276018143, 0.010378802195191383, 0.011194080114364624, 0.012009358033537865, 0.012824635952711105, 0.013639913871884346, 0.014455191791057587, 0.015270469710230827, 0.016085747629404068, 0.01690102554857731, 0.01771630346775055, 0.01853158138692379, 0.01934685930609703, 0.02016213722527027, 0.020977415144443512, 0.021792693063616753, 0.022607970982789993, 0.023423248901963234, 0.024238526821136475, 0.025053804740309715, 0.025869082659482956, 0.026684360578656197, 0.027499638497829437, 0.028314916417002678, 0.02913019433617592, 0.02994547225534916, 0.0307607501745224, 0.03157602623105049, 0.03239130228757858, 0.03320658206939697, 0.034021858125925064, 0.034837137907743454, 0.035652413964271545, 0.036467693746089935, 0.03728296980261803, 0.03809824958443642, 0.03891352564096451, 0.0397288054227829, 0.04054408147931099, 0.04135936126112938, 0.04217463731765747, 0.04298991709947586, 0.04380519315600395, 0.04462047293782234, 0.04543574899435043, 0.04625102877616882, 0.047066304832696915, 0.047881584614515305, 0.048696860671043396, 0.049512140452861786, 0.05032741650938988, 0.05114269629120827]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 5.0, 8.0, 10.0, 17.0, 26.0, 24.0, 30.0, 29.0, 42.0, 53.0, 62.0, 46.0, 58.0, 73.0, 70.0, 65.0, 44.0, 66.0, 65.0, 50.0, 38.0, 39.0, 23.0, 28.0, 15.0, 10.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.002855837345123291, -0.0027908040210604668, -0.0027257706969976425, -0.0026607373729348183, -0.002595704048871994, -0.0025306707248091698, -0.0024656374007463455, -0.0024006040766835213, -0.002335570752620697, -0.0022705374285578728, -0.0022055041044950485, -0.0021404707804322243, -0.0020754374563694, -0.0020104041323065758, -0.0019453708082437515, -0.0018803374841809273, -0.001815304160118103, -0.0017502708360552788, -0.0016852375119924545, -0.0016202041879296303, -0.001555170863866806, -0.0014901375398039818, -0.0014251042157411575, -0.0013600708916783333, -0.001295037567615509, -0.0012300042435526848, -0.0011649709194898605, -0.0010999375954270363, -0.001034904271364212, -0.0009698709473013878, -0.0009048376232385635, -0.0008398042991757393, -0.000774770975112915, -0.0007097376510500908, -0.0006447043269872665, -0.0005796710029244423, -0.000514637678861618, -0.0004496043547987938, -0.00038457103073596954, -0.0003195377066731453, -0.00025450438261032104, -0.0001894710585474968, -0.00012443773448467255, -5.94044104218483e-05, 5.628913640975952e-06, 7.06622377038002e-05, 0.00013569556176662445, 0.0002007288858294487, 0.00026576220989227295, 0.0003307955339550972, 0.00039582885801792145, 0.0004608621820807457, 0.00052589550614357, 0.0005909288302063942, 0.0006559621542692184, 0.0007209954783320427, 0.0007860288023948669, 0.0008510621264576912, 0.0009160954505205154, 0.0009811287745833397, 0.001046162098646164, 0.0011111954227089882, 0.0011762287467718124, 0.0012412620708346367, 0.001306295394897461]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 7.0, 7.0, 8.0, 9.0, 14.0, 20.0, 26.0, 22.0, 23.0, 32.0, 33.0, 30.0, 28.0, 34.0, 37.0, 36.0, 48.0, 55.0, 43.0, 45.0, 41.0, 24.0, 32.0, 41.0, 38.0, 30.0, 22.0, 33.0, 27.0, 29.0, 24.0, 22.0, 17.0, 19.0, 9.0, 3.0, 2.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.51171875, -6.2928466796875, -6.073974609375, -5.8551025390625, -5.63623046875, -5.4173583984375, -5.198486328125, -4.9796142578125, -4.7607421875, -4.5418701171875, -4.322998046875, -4.1041259765625, -3.88525390625, -3.6663818359375, -3.447509765625, -3.2286376953125, -3.009765625, -2.7908935546875, -2.572021484375, -2.3531494140625, -2.13427734375, -1.9154052734375, -1.696533203125, -1.4776611328125, -1.2587890625, -1.0399169921875, -0.821044921875, -0.6021728515625, -0.38330078125, -0.1644287109375, 0.054443359375, 0.2733154296875, 0.4921875, 0.7110595703125, 0.929931640625, 1.1488037109375, 1.36767578125, 1.5865478515625, 1.805419921875, 2.0242919921875, 2.2431640625, 2.4620361328125, 2.680908203125, 2.8997802734375, 3.11865234375, 3.3375244140625, 3.556396484375, 3.7752685546875, 3.994140625, 4.2130126953125, 4.431884765625, 4.6507568359375, 4.86962890625, 5.0885009765625, 5.307373046875, 5.5262451171875, 5.7451171875, 5.9639892578125, 6.182861328125, 6.4017333984375, 6.62060546875, 6.8394775390625, 7.058349609375, 7.2772216796875, 7.49609375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 9.0, 6.0, 15.0, 13.0, 24.0, 30.0, 35.0, 52.0, 56.0, 89.0, 143.0, 190.0, 248.0, 380.0, 492.0, 688.0, 1013.0, 1492.0, 2581.0, 5677.0, 18922.0, 90323.0, 480420.0, 356058.0, 63536.0, 14478.0, 4762.0, 2265.0, 1287.0, 964.0, 647.0, 450.0, 357.0, 258.0, 162.0, 121.0, 87.0, 61.0, 54.0, 38.0, 18.0, 13.0, 13.0, 12.0, 7.0, 8.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9765625, -11.60107421875, -11.2255859375, -10.85009765625, -10.474609375, -10.09912109375, -9.7236328125, -9.34814453125, -8.97265625, -8.59716796875, -8.2216796875, -7.84619140625, -7.470703125, -7.09521484375, -6.7197265625, -6.34423828125, -5.96875, -5.59326171875, -5.2177734375, -4.84228515625, -4.466796875, -4.09130859375, -3.7158203125, -3.34033203125, -2.96484375, -2.58935546875, -2.2138671875, -1.83837890625, -1.462890625, -1.08740234375, -0.7119140625, -0.33642578125, 0.0390625, 0.41455078125, 0.7900390625, 1.16552734375, 1.541015625, 1.91650390625, 2.2919921875, 2.66748046875, 3.04296875, 3.41845703125, 3.7939453125, 4.16943359375, 4.544921875, 4.92041015625, 5.2958984375, 5.67138671875, 6.046875, 6.42236328125, 6.7978515625, 7.17333984375, 7.548828125, 7.92431640625, 8.2998046875, 8.67529296875, 9.05078125, 9.42626953125, 9.8017578125, 10.17724609375, 10.552734375, 10.92822265625, 11.3037109375, 11.67919921875, 12.0546875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 10.0, 7.0, 9.0, 13.0, 20.0, 15.0, 20.0, 24.0, 22.0, 31.0, 35.0, 31.0, 56.0, 56.0, 74.0, 97.0, 283.0, 1545.0, 174.0, 87.0, 48.0, 52.0, 42.0, 54.0, 38.0, 33.0, 24.0, 19.0, 20.0, 21.0, 11.0, 9.0, 9.0, 5.0, 10.0, 7.0, 2.0, 7.0, 7.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.0546875, -14.5211181640625, -13.987548828125, -13.4539794921875, -12.92041015625, -12.3868408203125, -11.853271484375, -11.3197021484375, -10.7861328125, -10.2525634765625, -9.718994140625, -9.1854248046875, -8.65185546875, -8.1182861328125, -7.584716796875, -7.0511474609375, -6.517578125, -5.9840087890625, -5.450439453125, -4.9168701171875, -4.38330078125, -3.8497314453125, -3.316162109375, -2.7825927734375, -2.2490234375, -1.7154541015625, -1.181884765625, -0.6483154296875, -0.11474609375, 0.4188232421875, 0.952392578125, 1.4859619140625, 2.01953125, 2.5531005859375, 3.086669921875, 3.6202392578125, 4.15380859375, 4.6873779296875, 5.220947265625, 5.7545166015625, 6.2880859375, 6.8216552734375, 7.355224609375, 7.8887939453125, 8.42236328125, 8.9559326171875, 9.489501953125, 10.0230712890625, 10.556640625, 11.0902099609375, 11.623779296875, 12.1573486328125, 12.69091796875, 13.2244873046875, 13.758056640625, 14.2916259765625, 14.8251953125, 15.3587646484375, 15.892333984375, 16.4259033203125, 16.95947265625, 17.4930419921875, 18.026611328125, 18.5601806640625, 19.09375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 6.0, 14.0, 9.0, 24.0, 18.0, 23.0, 43.0, 50.0, 59.0, 91.0, 151.0, 216.0, 407.0, 813.0, 3367.0, 3101719.0, 36195.0, 1228.0, 491.0, 254.0, 145.0, 108.0, 71.0, 55.0, 29.0, 19.0, 17.0, 13.0, 13.0, 6.0, 13.0, 5.0, 3.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.75, -64.8271484375, -62.904296875, -60.9814453125, -59.05859375, -57.1357421875, -55.212890625, -53.2900390625, -51.3671875, -49.4443359375, -47.521484375, -45.5986328125, -43.67578125, -41.7529296875, -39.830078125, -37.9072265625, -35.984375, -34.0615234375, -32.138671875, -30.2158203125, -28.29296875, -26.3701171875, -24.447265625, -22.5244140625, -20.6015625, -18.6787109375, -16.755859375, -14.8330078125, -12.91015625, -10.9873046875, -9.064453125, -7.1416015625, -5.21875, -3.2958984375, -1.373046875, 0.5498046875, 2.47265625, 4.3955078125, 6.318359375, 8.2412109375, 10.1640625, 12.0869140625, 14.009765625, 15.9326171875, 17.85546875, 19.7783203125, 21.701171875, 23.6240234375, 25.546875, 27.4697265625, 29.392578125, 31.3154296875, 33.23828125, 35.1611328125, 37.083984375, 39.0068359375, 40.9296875, 42.8525390625, 44.775390625, 46.6982421875, 48.62109375, 50.5439453125, 52.466796875, 54.3896484375, 56.3125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 48.0, 734.0, 228.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.92311096191406, -202.90771484375, -196.89231872558594, -190.8769073486328, -184.86151123046875, -178.8461151123047, -172.83071899414062, -166.8153076171875, -160.79991149902344, -154.78451538085938, -148.7691192626953, -142.7537078857422, -136.73831176757812, -130.72291564941406, -124.70751953125, -118.6921157836914, -112.67671966552734, -106.66132354736328, -100.64591979980469, -94.63052368164062, -88.61511993408203, -82.59972381591797, -76.58432006835938, -70.56892395019531, -64.55352783203125, -58.53812789916992, -52.522727966308594, -46.50733184814453, -40.49192810058594, -34.476531982421875, -28.461132049560547, -22.44573211669922, -16.430328369140625, -10.414928436279297, -4.399529457092285, 1.6158695220947266, 7.631269454956055, 13.646669387817383, 19.662067413330078, 25.677467346191406, 31.692867279052734, 37.70826721191406, 43.72366714477539, 49.73906707763672, 55.75446319580078, 61.769866943359375, 67.78526306152344, 73.8006591796875, 79.8160629272461, 85.83145904541016, 91.84686279296875, 97.86225891113281, 103.8776626586914, 109.89305877685547, 115.90846252441406, 121.92385864257812, 127.93925476074219, 133.95465087890625, 139.9700469970703, 145.98545837402344, 152.0008544921875, 158.01625061035156, 164.03164672851562, 170.04705810546875, 176.0624542236328]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 6.0, 7.0, 10.0, 12.0, 12.0, 10.0, 18.0, 23.0, 28.0, 23.0, 25.0, 31.0, 27.0, 32.0, 39.0, 37.0, 44.0, 37.0, 58.0, 48.0, 36.0, 33.0, 37.0, 44.0, 30.0, 30.0, 33.0, 18.0, 35.0, 28.0, 26.0, 25.0, 17.0, 13.0, 13.0, 18.0, 6.0, 6.0, 6.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.710960388183594, -48.23847198486328, -46.765987396240234, -45.29350280761719, -43.821014404296875, -42.34852600097656, -40.876041412353516, -39.40355682373047, -37.931068420410156, -36.458580017089844, -34.9860954284668, -33.51361083984375, -32.04112243652344, -30.568635940551758, -29.096149444580078, -27.6236629486084, -26.15117645263672, -24.67868995666504, -23.20620346069336, -21.73371696472168, -20.26123046875, -18.78874397277832, -17.31625747680664, -15.843770980834961, -14.371284484863281, -12.898797988891602, -11.426311492919922, -9.953824996948242, -8.481338500976562, -7.008852005004883, -5.536365509033203, -4.063879013061523, -2.5913925170898438, -1.118906021118164, 0.3535804748535156, 1.8260669708251953, 3.298553466796875, 4.771039962768555, 6.243526458740234, 7.716012954711914, 9.188499450683594, 10.660985946655273, 12.133472442626953, 13.605958938598633, 15.078445434570312, 16.550931930541992, 18.023418426513672, 19.49590492248535, 20.96839141845703, 22.44087791442871, 23.91336441040039, 25.38585090637207, 26.85833740234375, 28.33082389831543, 29.80331039428711, 31.27579689025879, 32.74828338623047, 34.22077178955078, 35.69325637817383, 37.165740966796875, 38.63822937011719, 40.1107177734375, 41.58320236206055, 43.055686950683594, 44.528175354003906]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 1.0, 3.0, 8.0, 11.0, 10.0, 16.0, 13.0, 18.0, 23.0, 18.0, 31.0, 33.0, 39.0, 41.0, 44.0, 51.0, 50.0, 43.0, 46.0, 36.0, 36.0, 58.0, 41.0, 42.0, 33.0, 44.0, 38.0, 27.0, 20.0, 31.0, 15.0, 23.0, 12.0, 15.0, 11.0, 6.0, 5.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.36328125, -7.11932373046875, -6.8753662109375, -6.63140869140625, -6.387451171875, -6.14349365234375, -5.8995361328125, -5.65557861328125, -5.41162109375, -5.16766357421875, -4.9237060546875, -4.67974853515625, -4.435791015625, -4.19183349609375, -3.9478759765625, -3.70391845703125, -3.4599609375, -3.21600341796875, -2.9720458984375, -2.72808837890625, -2.484130859375, -2.24017333984375, -1.9962158203125, -1.75225830078125, -1.50830078125, -1.26434326171875, -1.0203857421875, -0.77642822265625, -0.532470703125, -0.28851318359375, -0.0445556640625, 0.19940185546875, 0.443359375, 0.68731689453125, 0.9312744140625, 1.17523193359375, 1.419189453125, 1.66314697265625, 1.9071044921875, 2.15106201171875, 2.39501953125, 2.63897705078125, 2.8829345703125, 3.12689208984375, 3.370849609375, 3.61480712890625, 3.8587646484375, 4.10272216796875, 4.3466796875, 4.59063720703125, 4.8345947265625, 5.07855224609375, 5.322509765625, 5.56646728515625, 5.8104248046875, 6.05438232421875, 6.29833984375, 6.54229736328125, 6.7862548828125, 7.03021240234375, 7.274169921875, 7.51812744140625, 7.7620849609375, 8.00604248046875, 8.25]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 7.0, 11.0, 8.0, 18.0, 21.0, 30.0, 32.0, 62.0, 56.0, 86.0, 145.0, 188.0, 264.0, 463.0, 852.0, 2251.0, 7867.0, 59855.0, 1161659.0, 2705491.0, 230804.0, 17412.0, 3745.0, 1320.0, 580.0, 297.0, 210.0, 124.0, 96.0, 83.0, 67.0, 39.0, 36.0, 26.0, 16.0, 19.0, 19.0, 4.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.90625, -15.362060546875, -14.81787109375, -14.273681640625, -13.7294921875, -13.185302734375, -12.64111328125, -12.096923828125, -11.552734375, -11.008544921875, -10.46435546875, -9.920166015625, -9.3759765625, -8.831787109375, -8.28759765625, -7.743408203125, -7.19921875, -6.655029296875, -6.11083984375, -5.566650390625, -5.0224609375, -4.478271484375, -3.93408203125, -3.389892578125, -2.845703125, -2.301513671875, -1.75732421875, -1.213134765625, -0.6689453125, -0.124755859375, 0.41943359375, 0.963623046875, 1.5078125, 2.052001953125, 2.59619140625, 3.140380859375, 3.6845703125, 4.228759765625, 4.77294921875, 5.317138671875, 5.861328125, 6.405517578125, 6.94970703125, 7.493896484375, 8.0380859375, 8.582275390625, 9.12646484375, 9.670654296875, 10.21484375, 10.759033203125, 11.30322265625, 11.847412109375, 12.3916015625, 12.935791015625, 13.47998046875, 14.024169921875, 14.568359375, 15.112548828125, 15.65673828125, 16.200927734375, 16.7451171875, 17.289306640625, 17.83349609375, 18.377685546875, 18.921875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 18.0, 13.0, 17.0, 17.0, 28.0, 42.0, 68.0, 76.0, 123.0, 155.0, 228.0, 322.0, 481.0, 637.0, 553.0, 360.0, 218.0, 199.0, 130.0, 84.0, 63.0, 70.0, 48.0, 35.0, 26.0, 15.0, 11.0, 6.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.7265625, -14.33544921875, -13.9443359375, -13.55322265625, -13.162109375, -12.77099609375, -12.3798828125, -11.98876953125, -11.59765625, -11.20654296875, -10.8154296875, -10.42431640625, -10.033203125, -9.64208984375, -9.2509765625, -8.85986328125, -8.46875, -8.07763671875, -7.6865234375, -7.29541015625, -6.904296875, -6.51318359375, -6.1220703125, -5.73095703125, -5.33984375, -4.94873046875, -4.5576171875, -4.16650390625, -3.775390625, -3.38427734375, -2.9931640625, -2.60205078125, -2.2109375, -1.81982421875, -1.4287109375, -1.03759765625, -0.646484375, -0.25537109375, 0.1357421875, 0.52685546875, 0.91796875, 1.30908203125, 1.7001953125, 2.09130859375, 2.482421875, 2.87353515625, 3.2646484375, 3.65576171875, 4.046875, 4.43798828125, 4.8291015625, 5.22021484375, 5.611328125, 6.00244140625, 6.3935546875, 6.78466796875, 7.17578125, 7.56689453125, 7.9580078125, 8.34912109375, 8.740234375, 9.13134765625, 9.5224609375, 9.91357421875, 10.3046875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 4.0, 4.0, 13.0, 18.0, 45.0, 51.0, 107.0, 208.0, 473.0, 1244.0, 5797.0, 468210.0, 3691047.0, 23814.0, 2018.0, 649.0, 249.0, 139.0, 75.0, 42.0, 28.0, 18.0, 11.0, 7.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.96875, -37.72021484375, -36.4716796875, -35.22314453125, -33.974609375, -32.72607421875, -31.4775390625, -30.22900390625, -28.98046875, -27.73193359375, -26.4833984375, -25.23486328125, -23.986328125, -22.73779296875, -21.4892578125, -20.24072265625, -18.9921875, -17.74365234375, -16.4951171875, -15.24658203125, -13.998046875, -12.74951171875, -11.5009765625, -10.25244140625, -9.00390625, -7.75537109375, -6.5068359375, -5.25830078125, -4.009765625, -2.76123046875, -1.5126953125, -0.26416015625, 0.984375, 2.23291015625, 3.4814453125, 4.72998046875, 5.978515625, 7.22705078125, 8.4755859375, 9.72412109375, 10.97265625, 12.22119140625, 13.4697265625, 14.71826171875, 15.966796875, 17.21533203125, 18.4638671875, 19.71240234375, 20.9609375, 22.20947265625, 23.4580078125, 24.70654296875, 25.955078125, 27.20361328125, 28.4521484375, 29.70068359375, 30.94921875, 32.19775390625, 33.4462890625, 34.69482421875, 35.943359375, 37.19189453125, 38.4404296875, 39.68896484375, 40.9375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 65.0, 925.0, 26.0, 4.0, 0.0, 0.0, 1.0], "bins": [-877.8282470703125, -862.8021240234375, -847.7760620117188, -832.75, -817.723876953125, -802.69775390625, -787.6716918945312, -772.6456298828125, -757.6195068359375, -742.5933837890625, -727.5673217773438, -712.541259765625, -697.51513671875, -682.489013671875, -667.4629516601562, -652.4368896484375, -637.4107666015625, -622.3846435546875, -607.3585815429688, -592.33251953125, -577.306396484375, -562.2802734375, -547.2542114257812, -532.2281494140625, -517.2020263671875, -502.1759338378906, -487.14984130859375, -472.1237487792969, -457.09765625, -442.0715637207031, -427.04547119140625, -412.0193786621094, -396.9932861328125, -381.9671936035156, -366.94110107421875, -351.9150085449219, -336.888916015625, -321.8628234863281, -306.83673095703125, -291.8106384277344, -276.7845458984375, -261.7584533691406, -246.73236083984375, -231.70626831054688, -216.68017578125, -201.65408325195312, -186.62799072265625, -171.60189819335938, -156.5758056640625, -141.54971313476562, -126.52362060546875, -111.49752807617188, -96.471435546875, -81.44534301757812, -66.41925048828125, -51.393157958984375, -36.36707305908203, -21.340980529785156, -6.314888000488281, 8.711204528808594, 23.73729705810547, 38.763389587402344, 53.78948211669922, 68.8155746459961, 83.84166717529297]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 7.0, 4.0, 15.0, 13.0, 12.0, 22.0, 22.0, 23.0, 22.0, 27.0, 31.0, 32.0, 45.0, 46.0, 53.0, 54.0, 38.0, 39.0, 44.0, 46.0, 40.0, 45.0, 48.0, 32.0, 35.0, 27.0, 18.0, 16.0, 13.0, 24.0, 14.0, 13.0, 13.0, 14.0, 12.0, 10.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.21849822998047, -39.870723724365234, -38.52294921875, -37.17517852783203, -35.8274040222168, -34.47962951660156, -33.13185501098633, -31.784080505371094, -30.43630599975586, -29.088531494140625, -27.740758895874023, -26.39298439025879, -25.045209884643555, -23.697437286376953, -22.34966278076172, -21.001888275146484, -19.654115676879883, -18.30634117126465, -16.958568572998047, -15.610794067382812, -14.263019561767578, -12.91524600982666, -11.567472457885742, -10.219697952270508, -8.87192440032959, -7.524150371551514, -6.1763763427734375, -4.8286027908325195, -3.4808287620544434, -2.133054733276367, -0.7852811813354492, 0.5624933242797852, 1.9102668762207031, 3.2580409049987793, 4.6058149337768555, 5.953588485717773, 7.30136251449585, 8.649136543273926, 9.996910095214844, 11.344684600830078, 12.692458152770996, 14.040231704711914, 15.388006210327148, 16.73577880859375, 18.083553314208984, 19.43132781982422, 20.779102325439453, 22.126876831054688, 23.47464942932129, 24.822423934936523, 26.170196533203125, 27.51797103881836, 28.865745544433594, 30.213520050048828, 31.56129264831543, 32.90906524658203, 34.256839752197266, 35.6046142578125, 36.952388763427734, 38.30016326904297, 39.64793395996094, 40.99570846557617, 42.343482971191406, 43.69125747680664, 45.039031982421875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 7.0, 11.0, 10.0, 8.0, 21.0, 24.0, 23.0, 23.0, 23.0, 35.0, 33.0, 35.0, 46.0, 54.0, 46.0, 46.0, 52.0, 49.0, 54.0, 49.0, 44.0, 39.0, 33.0, 37.0, 29.0, 28.0, 26.0, 27.0, 13.0, 10.0, 18.0, 7.0, 12.0, 8.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.56494140625, -6.3759765625, -6.18701171875, -5.998046875, -5.80908203125, -5.6201171875, -5.43115234375, -5.2421875, -5.05322265625, -4.8642578125, -4.67529296875, -4.486328125, -4.29736328125, -4.1083984375, -3.91943359375, -3.73046875, -3.54150390625, -3.3525390625, -3.16357421875, -2.974609375, -2.78564453125, -2.5966796875, -2.40771484375, -2.21875, -2.02978515625, -1.8408203125, -1.65185546875, -1.462890625, -1.27392578125, -1.0849609375, -0.89599609375, -0.70703125, -0.51806640625, -0.3291015625, -0.14013671875, 0.048828125, 0.23779296875, 0.4267578125, 0.61572265625, 0.8046875, 0.99365234375, 1.1826171875, 1.37158203125, 1.560546875, 1.74951171875, 1.9384765625, 2.12744140625, 2.31640625, 2.50537109375, 2.6943359375, 2.88330078125, 3.072265625, 3.26123046875, 3.4501953125, 3.63916015625, 3.828125, 4.01708984375, 4.2060546875, 4.39501953125, 4.583984375, 4.77294921875, 4.9619140625, 5.15087890625, 5.33984375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 7.0, 7.0, 9.0, 19.0, 22.0, 40.0, 42.0, 66.0, 97.0, 118.0, 189.0, 230.0, 357.0, 487.0, 640.0, 934.0, 1296.0, 1769.0, 2559.0, 3505.0, 5139.0, 7519.0, 11091.0, 17117.0, 26390.0, 42101.0, 69008.0, 118177.0, 191284.0, 203960.0, 133178.0, 77372.0, 46738.0, 29159.0, 18610.0, 12237.0, 8098.0, 5521.0, 3904.0, 2762.0, 1921.0, 1390.0, 944.0, 705.0, 525.0, 375.0, 297.0, 204.0, 131.0, 87.0, 80.0, 44.0, 35.0, 25.0, 15.0, 12.0, 10.0, 7.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.6220703125, -0.6020736694335938, -0.5820770263671875, -0.5620803833007812, -0.542083740234375, -0.5220870971679688, -0.5020904541015625, -0.48209381103515625, -0.46209716796875, -0.44210052490234375, -0.4221038818359375, -0.40210723876953125, -0.382110595703125, -0.36211395263671875, -0.3421173095703125, -0.32212066650390625, -0.3021240234375, -0.28212738037109375, -0.2621307373046875, -0.24213409423828125, -0.222137451171875, -0.20214080810546875, -0.1821441650390625, -0.16214752197265625, -0.14215087890625, -0.12215423583984375, -0.1021575927734375, -0.08216094970703125, -0.062164306640625, -0.04216766357421875, -0.0221710205078125, -0.00217437744140625, 0.017822265625, 0.03781890869140625, 0.0578155517578125, 0.07781219482421875, 0.097808837890625, 0.11780548095703125, 0.1378021240234375, 0.15779876708984375, 0.17779541015625, 0.19779205322265625, 0.2177886962890625, 0.23778533935546875, 0.257781982421875, 0.27777862548828125, 0.2977752685546875, 0.31777191162109375, 0.3377685546875, 0.35776519775390625, 0.3777618408203125, 0.39775848388671875, 0.417755126953125, 0.43775177001953125, 0.4577484130859375, 0.47774505615234375, 0.49774169921875, 0.5177383422851562, 0.5377349853515625, 0.5577316284179688, 0.577728271484375, 0.5977249145507812, 0.6177215576171875, 0.6377182006835938, 0.65771484375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 3.0, 1.0, 5.0, 8.0, 8.0, 6.0, 16.0, 18.0, 17.0, 21.0, 27.0, 27.0, 26.0, 27.0, 29.0, 32.0, 26.0, 38.0, 51.0, 56.0, 46.0, 1070.0, 54.0, 35.0, 38.0, 36.0, 26.0, 38.0, 33.0, 34.0, 33.0, 22.0, 22.0, 18.0, 14.0, 13.0, 12.0, 14.0, 5.0, 12.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.478515625, -3.371337890625, -3.26416015625, -3.156982421875, -3.0498046875, -2.942626953125, -2.83544921875, -2.728271484375, -2.62109375, -2.513916015625, -2.40673828125, -2.299560546875, -2.1923828125, -2.085205078125, -1.97802734375, -1.870849609375, -1.763671875, -1.656494140625, -1.54931640625, -1.442138671875, -1.3349609375, -1.227783203125, -1.12060546875, -1.013427734375, -0.90625, -0.799072265625, -0.69189453125, -0.584716796875, -0.4775390625, -0.370361328125, -0.26318359375, -0.156005859375, -0.048828125, 0.058349609375, 0.16552734375, 0.272705078125, 0.3798828125, 0.487060546875, 0.59423828125, 0.701416015625, 0.80859375, 0.915771484375, 1.02294921875, 1.130126953125, 1.2373046875, 1.344482421875, 1.45166015625, 1.558837890625, 1.666015625, 1.773193359375, 1.88037109375, 1.987548828125, 2.0947265625, 2.201904296875, 2.30908203125, 2.416259765625, 2.5234375, 2.630615234375, 2.73779296875, 2.844970703125, 2.9521484375, 3.059326171875, 3.16650390625, 3.273681640625, 3.380859375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 8.0, 5.0, 13.0, 22.0, 23.0, 41.0, 48.0, 97.0, 131.0, 217.0, 311.0, 473.0, 762.0, 1193.0, 1857.0, 3028.0, 4942.0, 7999.0, 13899.0, 23807.0, 40539.0, 71963.0, 126860.0, 217354.0, 1253651.0, 139914.0, 79021.0, 44535.0, 25740.0, 15314.0, 8946.0, 5442.0, 3285.0, 2077.0, 1323.0, 769.0, 559.0, 324.0, 210.0, 152.0, 97.0, 50.0, 45.0, 32.0, 17.0, 13.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.595703125, -0.57769775390625, -0.5596923828125, -0.54168701171875, -0.523681640625, -0.50567626953125, -0.4876708984375, -0.46966552734375, -0.45166015625, -0.43365478515625, -0.4156494140625, -0.39764404296875, -0.379638671875, -0.36163330078125, -0.3436279296875, -0.32562255859375, -0.3076171875, -0.28961181640625, -0.2716064453125, -0.25360107421875, -0.235595703125, -0.21759033203125, -0.1995849609375, -0.18157958984375, -0.16357421875, -0.14556884765625, -0.1275634765625, -0.10955810546875, -0.091552734375, -0.07354736328125, -0.0555419921875, -0.03753662109375, -0.01953125, -0.00152587890625, 0.0164794921875, 0.03448486328125, 0.052490234375, 0.07049560546875, 0.0885009765625, 0.10650634765625, 0.12451171875, 0.14251708984375, 0.1605224609375, 0.17852783203125, 0.196533203125, 0.21453857421875, 0.2325439453125, 0.25054931640625, 0.2685546875, 0.28656005859375, 0.3045654296875, 0.32257080078125, 0.340576171875, 0.35858154296875, 0.3765869140625, 0.39459228515625, 0.41259765625, 0.43060302734375, 0.4486083984375, 0.46661376953125, 0.484619140625, 0.50262451171875, 0.5206298828125, 0.53863525390625, 0.556640625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 8.0, 13.0, 14.0, 25.0, 22.0, 20.0, 39.0, 40.0, 50.0, 58.0, 53.0, 69.0, 70.0, 60.0, 73.0, 58.0, 58.0, 42.0, 46.0, 43.0, 24.0, 14.0, 17.0, 12.0, 14.0, 7.0, 6.0, 11.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0023441314697265625, -0.0022708475589752197, -0.002197563648223877, -0.002124279737472534, -0.0020509958267211914, -0.0019777119159698486, -0.0019044280052185059, -0.001831144094467163, -0.0017578601837158203, -0.0016845762729644775, -0.0016112923622131348, -0.001538008451461792, -0.0014647245407104492, -0.0013914406299591064, -0.0013181567192077637, -0.001244872808456421, -0.0011715888977050781, -0.0010983049869537354, -0.0010250210762023926, -0.0009517371654510498, -0.000878453254699707, -0.0008051693439483643, -0.0007318854331970215, -0.0006586015224456787, -0.0005853176116943359, -0.0005120337009429932, -0.0004387497901916504, -0.0003654658794403076, -0.00029218196868896484, -0.00021889805793762207, -0.0001456141471862793, -7.233023643493652e-05, 9.5367431640625e-07, 7.423758506774902e-05, 0.0001475214958190918, 0.00022080540657043457, 0.00029408931732177734, 0.0003673732280731201, 0.0004406571388244629, 0.0005139410495758057, 0.0005872249603271484, 0.0006605088710784912, 0.000733792781829834, 0.0008070766925811768, 0.0008803606033325195, 0.0009536445140838623, 0.001026928424835205, 0.0011002123355865479, 0.0011734962463378906, 0.0012467801570892334, 0.0013200640678405762, 0.001393347978591919, 0.0014666318893432617, 0.0015399158000946045, 0.0016131997108459473, 0.00168648362159729, 0.0017597675323486328, 0.0018330514430999756, 0.0019063353538513184, 0.001979619264602661, 0.002052903175354004, 0.0021261870861053467, 0.0021994709968566895, 0.0022727549076080322, 0.002346038818359375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 5.0, 11.0, 18.0, 23.0, 28.0, 30.0, 42.0, 49.0, 79.0, 132.0, 176.0, 300.0, 453.0, 928.0, 21364.0, 1020948.0, 2171.0, 636.0, 362.0, 213.0, 158.0, 97.0, 81.0, 66.0, 47.0, 32.0, 25.0, 13.0, 15.0, 10.0, 3.0, 6.0, 2.0, 0.0, 7.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04681396484375, -0.045317649841308594, -0.04382133483886719, -0.04232501983642578, -0.040828704833984375, -0.03933238983154297, -0.03783607482910156, -0.036339759826660156, -0.03484344482421875, -0.033347129821777344, -0.03185081481933594, -0.03035449981689453, -0.028858184814453125, -0.02736186981201172, -0.025865554809570312, -0.024369239807128906, -0.0228729248046875, -0.021376609802246094, -0.019880294799804688, -0.01838397979736328, -0.016887664794921875, -0.015391349792480469, -0.013895034790039062, -0.012398719787597656, -0.01090240478515625, -0.009406089782714844, -0.007909774780273438, -0.006413459777832031, -0.004917144775390625, -0.0034208297729492188, -0.0019245147705078125, -0.00042819976806640625, 0.001068115234375, 0.0025644302368164062, 0.0040607452392578125, 0.005557060241699219, 0.007053375244140625, 0.008549690246582031, 0.010046005249023438, 0.011542320251464844, 0.01303863525390625, 0.014534950256347656, 0.016031265258789062, 0.01752758026123047, 0.019023895263671875, 0.02052021026611328, 0.022016525268554688, 0.023512840270996094, 0.0250091552734375, 0.026505470275878906, 0.028001785278320312, 0.02949810028076172, 0.030994415283203125, 0.03249073028564453, 0.03398704528808594, 0.035483360290527344, 0.03697967529296875, 0.038475990295410156, 0.03997230529785156, 0.04146862030029297, 0.042964935302734375, 0.04446125030517578, 0.04595756530761719, 0.047453880310058594, 0.0489501953125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 752.0, 263.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011446215212345123, -0.00053387664956972, 7.686822209507227e-05, 0.0006876131519675255, 0.0012983579654246569, 0.0019091027788817883, 0.0025198478251695633, 0.003130592405796051, 0.003741337452083826, 0.004352082498371601, 0.004962827078998089, 0.005573572125285864, 0.006184317171573639, 0.006795061752200127, 0.007405806798487902, 0.008016550913453102, 0.008627296425402164, 0.009238041006028652, 0.009848786517977715, 0.010459531098604202, 0.01107027567923069, 0.011681020259857178, 0.01229176577180624, 0.012902510352432728, 0.01351325586438179, 0.014124000445008278, 0.01473474595695734, 0.015345490537583828, 0.01595623604953289, 0.016566980630159378, 0.017177725210785866, 0.017788469791412354, 0.01839921437203884, 0.01900995895266533, 0.019620703533291817, 0.020231448113918304, 0.02084219455718994, 0.02145293913781643, 0.022063683718442917, 0.022674428299069405, 0.023285172879695892, 0.02389591746032238, 0.024506662040948868, 0.025117408484220505, 0.025728153064846992, 0.02633889764547348, 0.026949642226099968, 0.027560386806726456, 0.028171133249998093, 0.02878187783062458, 0.029392622411251068, 0.030003368854522705, 0.030614113435149193, 0.03122485801577568, 0.03183560073375702, 0.032446347177028656, 0.033057089895009995, 0.03366783633828163, 0.03427857905626297, 0.03488932549953461, 0.035500068217515945, 0.03611081466078758, 0.03672155737876892, 0.03733230382204056, 0.037943050265312195]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 13.0, 15.0, 17.0, 29.0, 29.0, 35.0, 40.0, 44.0, 43.0, 52.0, 59.0, 50.0, 57.0, 62.0, 51.0, 49.0, 43.0, 50.0, 40.0, 30.0, 35.0, 27.0, 27.0, 24.0, 14.0, 19.0, 11.0, 7.0, 7.0, 1.0, 8.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.0020979642868041992, -0.002047979272902012, -0.0019979942589998245, -0.0019480092450976372, -0.0018980242311954498, -0.0018480392172932625, -0.0017980542033910751, -0.0017480691894888878, -0.0016980841755867004, -0.001648099161684513, -0.0015981141477823257, -0.0015481291338801384, -0.001498144119977951, -0.0014481591060757637, -0.0013981740921735764, -0.001348189078271389, -0.0012982040643692017, -0.0012482190504670143, -0.001198234036564827, -0.0011482490226626396, -0.0010982640087604523, -0.001048278994858265, -0.0009982939809560776, -0.0009483089670538902, -0.0008983239531517029, -0.0008483389392495155, -0.0007983539253473282, -0.0007483689114451408, -0.0006983838975429535, -0.0006483988836407661, -0.0005984138697385788, -0.0005484288558363914, -0.0004984438419342041, -0.00044845882803201675, -0.0003984738141298294, -0.00034848880022764206, -0.0002985037863254547, -0.00024851877242326736, -0.00019853375852108002, -0.00014854874461889267, -9.856373071670532e-05, -4.8578716814517975e-05, 1.4062970876693726e-06, 5.139131098985672e-05, 0.00010137632489204407, 0.00015136133879423141, 0.00020134635269641876, 0.0002513313665986061, 0.00030131638050079346, 0.0003513013944029808, 0.00040128640830516815, 0.0004512714222073555, 0.0005012564361095428, 0.0005512414500117302, 0.0006012264639139175, 0.0006512114778161049, 0.0007011964917182922, 0.0007511815056204796, 0.0008011665195226669, 0.0008511515334248543, 0.0009011365473270416, 0.000951121561229229, 0.0010011065751314163, 0.0010510915890336037, 0.001101076602935791]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 7.0, 11.0, 10.0, 8.0, 21.0, 24.0, 23.0, 23.0, 23.0, 35.0, 33.0, 35.0, 46.0, 54.0, 46.0, 46.0, 52.0, 49.0, 54.0, 49.0, 44.0, 39.0, 33.0, 37.0, 29.0, 28.0, 26.0, 27.0, 13.0, 10.0, 18.0, 7.0, 12.0, 8.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.56494140625, -6.3759765625, -6.18701171875, -5.998046875, -5.80908203125, -5.6201171875, -5.43115234375, -5.2421875, -5.05322265625, -4.8642578125, -4.67529296875, -4.486328125, -4.29736328125, -4.1083984375, -3.91943359375, -3.73046875, -3.54150390625, -3.3525390625, -3.16357421875, -2.974609375, -2.78564453125, -2.5966796875, -2.40771484375, -2.21875, -2.02978515625, -1.8408203125, -1.65185546875, -1.462890625, -1.27392578125, -1.0849609375, -0.89599609375, -0.70703125, -0.51806640625, -0.3291015625, -0.14013671875, 0.048828125, 0.23779296875, 0.4267578125, 0.61572265625, 0.8046875, 0.99365234375, 1.1826171875, 1.37158203125, 1.560546875, 1.74951171875, 1.9384765625, 2.12744140625, 2.31640625, 2.50537109375, 2.6943359375, 2.88330078125, 3.072265625, 3.26123046875, 3.4501953125, 3.63916015625, 3.828125, 4.01708984375, 4.2060546875, 4.39501953125, 4.583984375, 4.77294921875, 4.9619140625, 5.15087890625, 5.33984375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 0.0, 3.0, 5.0, 5.0, 10.0, 11.0, 23.0, 28.0, 27.0, 61.0, 82.0, 119.0, 169.0, 253.0, 374.0, 566.0, 819.0, 1424.0, 2236.0, 4419.0, 11927.0, 76621.0, 718412.0, 197393.0, 20207.0, 5856.0, 2928.0, 1537.0, 1019.0, 685.0, 449.0, 248.0, 199.0, 139.0, 103.0, 63.0, 35.0, 34.0, 13.0, 19.0, 15.0, 11.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.765625, -13.28564453125, -12.8056640625, -12.32568359375, -11.845703125, -11.36572265625, -10.8857421875, -10.40576171875, -9.92578125, -9.44580078125, -8.9658203125, -8.48583984375, -8.005859375, -7.52587890625, -7.0458984375, -6.56591796875, -6.0859375, -5.60595703125, -5.1259765625, -4.64599609375, -4.166015625, -3.68603515625, -3.2060546875, -2.72607421875, -2.24609375, -1.76611328125, -1.2861328125, -0.80615234375, -0.326171875, 0.15380859375, 0.6337890625, 1.11376953125, 1.59375, 2.07373046875, 2.5537109375, 3.03369140625, 3.513671875, 3.99365234375, 4.4736328125, 4.95361328125, 5.43359375, 5.91357421875, 6.3935546875, 6.87353515625, 7.353515625, 7.83349609375, 8.3134765625, 8.79345703125, 9.2734375, 9.75341796875, 10.2333984375, 10.71337890625, 11.193359375, 11.67333984375, 12.1533203125, 12.63330078125, 13.11328125, 13.59326171875, 14.0732421875, 14.55322265625, 15.033203125, 15.51318359375, 15.9931640625, 16.47314453125, 16.953125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 7.0, 3.0, 7.0, 10.0, 12.0, 13.0, 19.0, 21.0, 25.0, 23.0, 42.0, 41.0, 30.0, 52.0, 57.0, 83.0, 215.0, 1654.0, 246.0, 89.0, 63.0, 51.0, 48.0, 37.0, 39.0, 20.0, 26.0, 25.0, 12.0, 12.0, 13.0, 9.0, 8.0, 4.0, 11.0, 5.0, 8.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.03125, -13.556640625, -13.08203125, -12.607421875, -12.1328125, -11.658203125, -11.18359375, -10.708984375, -10.234375, -9.759765625, -9.28515625, -8.810546875, -8.3359375, -7.861328125, -7.38671875, -6.912109375, -6.4375, -5.962890625, -5.48828125, -5.013671875, -4.5390625, -4.064453125, -3.58984375, -3.115234375, -2.640625, -2.166015625, -1.69140625, -1.216796875, -0.7421875, -0.267578125, 0.20703125, 0.681640625, 1.15625, 1.630859375, 2.10546875, 2.580078125, 3.0546875, 3.529296875, 4.00390625, 4.478515625, 4.953125, 5.427734375, 5.90234375, 6.376953125, 6.8515625, 7.326171875, 7.80078125, 8.275390625, 8.75, 9.224609375, 9.69921875, 10.173828125, 10.6484375, 11.123046875, 11.59765625, 12.072265625, 12.546875, 13.021484375, 13.49609375, 13.970703125, 14.4453125, 14.919921875, 15.39453125, 15.869140625, 16.34375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 6.0, 10.0, 13.0, 11.0, 20.0, 32.0, 26.0, 38.0, 45.0, 73.0, 70.0, 119.0, 167.0, 257.0, 492.0, 1067.0, 9359.0, 3118035.0, 13236.0, 1197.0, 496.0, 252.0, 183.0, 115.0, 92.0, 71.0, 56.0, 30.0, 28.0, 30.0, 25.0, 14.0, 6.0, 3.0, 2.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.8125, -42.4658203125, -41.119140625, -39.7724609375, -38.42578125, -37.0791015625, -35.732421875, -34.3857421875, -33.0390625, -31.6923828125, -30.345703125, -28.9990234375, -27.65234375, -26.3056640625, -24.958984375, -23.6123046875, -22.265625, -20.9189453125, -19.572265625, -18.2255859375, -16.87890625, -15.5322265625, -14.185546875, -12.8388671875, -11.4921875, -10.1455078125, -8.798828125, -7.4521484375, -6.10546875, -4.7587890625, -3.412109375, -2.0654296875, -0.71875, 0.6279296875, 1.974609375, 3.3212890625, 4.66796875, 6.0146484375, 7.361328125, 8.7080078125, 10.0546875, 11.4013671875, 12.748046875, 14.0947265625, 15.44140625, 16.7880859375, 18.134765625, 19.4814453125, 20.828125, 22.1748046875, 23.521484375, 24.8681640625, 26.21484375, 27.5615234375, 28.908203125, 30.2548828125, 31.6015625, 32.9482421875, 34.294921875, 35.6416015625, 36.98828125, 38.3349609375, 39.681640625, 41.0283203125, 42.375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 20.0, 77.0, 179.0, 333.0, 257.0, 88.0, 39.0, 10.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.76789093017578, -79.79903411865234, -77.8301773071289, -75.86132049560547, -73.89246368408203, -71.9236068725586, -69.95475006103516, -67.98589324951172, -66.01703643798828, -64.04817962646484, -62.079322814941406, -60.11046600341797, -58.14160919189453, -56.172752380371094, -54.203895568847656, -52.23503875732422, -50.26618194580078, -48.297325134277344, -46.328468322753906, -44.35961151123047, -42.39075469970703, -40.421897888183594, -38.453041076660156, -36.48418426513672, -34.51533126831055, -32.54647445678711, -30.577617645263672, -28.608760833740234, -26.639904022216797, -24.67104721069336, -22.702190399169922, -20.733333587646484, -18.764476776123047, -16.79561996459961, -14.826763153076172, -12.857906341552734, -10.889049530029297, -8.920193672180176, -6.951336860656738, -4.982480049133301, -3.0136232376098633, -1.0447665452957153, 0.9240901470184326, 2.892946720123291, 4.8618035316467285, 6.830659866333008, 8.799516677856445, 10.768373489379883, 12.73723030090332, 14.706087112426758, 16.674943923950195, 18.643800735473633, 20.61265754699707, 22.581512451171875, 24.550369262695312, 26.51922607421875, 28.488082885742188, 30.456939697265625, 32.42579650878906, 34.3946533203125, 36.36351013183594, 38.332366943359375, 40.30122375488281, 42.27008056640625, 44.23893737792969]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 6.0, 7.0, 6.0, 10.0, 12.0, 14.0, 12.0, 22.0, 21.0, 37.0, 30.0, 35.0, 36.0, 36.0, 34.0, 58.0, 54.0, 48.0, 46.0, 46.0, 46.0, 37.0, 41.0, 45.0, 36.0, 34.0, 36.0, 23.0, 15.0, 18.0, 18.0, 18.0, 19.0, 13.0, 9.0, 2.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.32217788696289, -34.93650817871094, -33.55084228515625, -32.1651725769043, -30.779502868652344, -29.393835067749023, -28.008167266845703, -26.62249755859375, -25.23682975769043, -23.85116195678711, -22.465492248535156, -21.079824447631836, -19.694156646728516, -18.308486938476562, -16.922819137573242, -15.537150382995605, -14.151481628417969, -12.765812873840332, -11.380144119262695, -9.994476318359375, -8.608807563781738, -7.223138809204102, -5.837471008300781, -4.4518022537231445, -3.066133499145508, -1.6804649829864502, -0.2947964668273926, 1.090871810913086, 2.4765405654907227, 3.8622093200683594, 5.24787712097168, 6.633545875549316, 8.019218444824219, 9.404887199401855, 10.790555953979492, 12.176223754882812, 13.56189250946045, 14.947561264038086, 16.333229064941406, 17.71889877319336, 19.10456657409668, 20.490234375, 21.875904083251953, 23.261571884155273, 24.647239685058594, 26.032909393310547, 27.418577194213867, 28.804244995117188, 30.18991470336914, 31.57558250427246, 32.96125030517578, 34.346920013427734, 35.73258972167969, 37.118255615234375, 38.50392532348633, 39.88959503173828, 41.27526092529297, 42.66093063354492, 44.04659652709961, 45.43226623535156, 46.817935943603516, 48.20360565185547, 49.589271545410156, 50.97494125366211, 52.36061096191406]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 8.0, 6.0, 7.0, 13.0, 20.0, 21.0, 14.0, 25.0, 37.0, 27.0, 39.0, 46.0, 52.0, 52.0, 56.0, 55.0, 50.0, 48.0, 52.0, 52.0, 37.0, 40.0, 43.0, 33.0, 23.0, 33.0, 25.0, 18.0, 15.0, 9.0, 7.0, 10.0, 6.0, 7.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-8.4453125, -8.23016357421875, -8.0150146484375, -7.79986572265625, -7.584716796875, -7.36956787109375, -7.1544189453125, -6.93927001953125, -6.72412109375, -6.50897216796875, -6.2938232421875, -6.07867431640625, -5.863525390625, -5.64837646484375, -5.4332275390625, -5.21807861328125, -5.0029296875, -4.78778076171875, -4.5726318359375, -4.35748291015625, -4.142333984375, -3.92718505859375, -3.7120361328125, -3.49688720703125, -3.28173828125, -3.06658935546875, -2.8514404296875, -2.63629150390625, -2.421142578125, -2.20599365234375, -1.9908447265625, -1.77569580078125, -1.560546875, -1.34539794921875, -1.1302490234375, -0.91510009765625, -0.699951171875, -0.48480224609375, -0.2696533203125, -0.05450439453125, 0.16064453125, 0.37579345703125, 0.5909423828125, 0.80609130859375, 1.021240234375, 1.23638916015625, 1.4515380859375, 1.66668701171875, 1.8818359375, 2.09698486328125, 2.3121337890625, 2.52728271484375, 2.742431640625, 2.95758056640625, 3.1727294921875, 3.38787841796875, 3.60302734375, 3.81817626953125, 4.0333251953125, 4.24847412109375, 4.463623046875, 4.67877197265625, 4.8939208984375, 5.10906982421875, 5.32421875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 2.0, 5.0, 10.0, 11.0, 14.0, 18.0, 25.0, 36.0, 40.0, 60.0, 61.0, 107.0, 166.0, 196.0, 319.0, 512.0, 774.0, 1377.0, 2452.0, 4824.0, 10949.0, 38124.0, 260956.0, 1456664.0, 1921304.0, 407484.0, 60104.0, 14695.0, 6000.0, 2836.0, 1574.0, 913.0, 556.0, 351.0, 231.0, 152.0, 105.0, 81.0, 45.0, 41.0, 21.0, 14.0, 32.0, 14.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.5, -9.2215576171875, -8.943115234375, -8.6646728515625, -8.38623046875, -8.1077880859375, -7.829345703125, -7.5509033203125, -7.2724609375, -6.9940185546875, -6.715576171875, -6.4371337890625, -6.15869140625, -5.8802490234375, -5.601806640625, -5.3233642578125, -5.044921875, -4.7664794921875, -4.488037109375, -4.2095947265625, -3.93115234375, -3.6527099609375, -3.374267578125, -3.0958251953125, -2.8173828125, -2.5389404296875, -2.260498046875, -1.9820556640625, -1.70361328125, -1.4251708984375, -1.146728515625, -0.8682861328125, -0.58984375, -0.3114013671875, -0.032958984375, 0.2454833984375, 0.52392578125, 0.8023681640625, 1.080810546875, 1.3592529296875, 1.6376953125, 1.9161376953125, 2.194580078125, 2.4730224609375, 2.75146484375, 3.0299072265625, 3.308349609375, 3.5867919921875, 3.865234375, 4.1436767578125, 4.422119140625, 4.7005615234375, 4.97900390625, 5.2574462890625, 5.535888671875, 5.8143310546875, 6.0927734375, 6.3712158203125, 6.649658203125, 6.9281005859375, 7.20654296875, 7.4849853515625, 7.763427734375, 8.0418701171875, 8.3203125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 9.0, 19.0, 86.0, 247.0, 625.0, 1685.0, 956.0, 328.0, 94.0, 19.0, 13.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.34619140625, -31.2548828125, -30.16357421875, -29.072265625, -27.98095703125, -26.8896484375, -25.79833984375, -24.70703125, -23.61572265625, -22.5244140625, -21.43310546875, -20.341796875, -19.25048828125, -18.1591796875, -17.06787109375, -15.9765625, -14.88525390625, -13.7939453125, -12.70263671875, -11.611328125, -10.52001953125, -9.4287109375, -8.33740234375, -7.24609375, -6.15478515625, -5.0634765625, -3.97216796875, -2.880859375, -1.78955078125, -0.6982421875, 0.39306640625, 1.484375, 2.57568359375, 3.6669921875, 4.75830078125, 5.849609375, 6.94091796875, 8.0322265625, 9.12353515625, 10.21484375, 11.30615234375, 12.3974609375, 13.48876953125, 14.580078125, 15.67138671875, 16.7626953125, 17.85400390625, 18.9453125, 20.03662109375, 21.1279296875, 22.21923828125, 23.310546875, 24.40185546875, 25.4931640625, 26.58447265625, 27.67578125, 28.76708984375, 29.8583984375, 30.94970703125, 32.041015625, 33.13232421875, 34.2236328125, 35.31494140625, 36.40625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 12.0, 28.0, 56.0, 175.0, 565.0, 1972.0, 73297.0, 4111303.0, 5234.0, 1072.0, 318.0, 126.0, 50.0, 21.0, 12.0, 5.0, 7.0, 5.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.0625, -53.30078125, -51.5390625, -49.77734375, -48.015625, -46.25390625, -44.4921875, -42.73046875, -40.96875, -39.20703125, -37.4453125, -35.68359375, -33.921875, -32.16015625, -30.3984375, -28.63671875, -26.875, -25.11328125, -23.3515625, -21.58984375, -19.828125, -18.06640625, -16.3046875, -14.54296875, -12.78125, -11.01953125, -9.2578125, -7.49609375, -5.734375, -3.97265625, -2.2109375, -0.44921875, 1.3125, 3.07421875, 4.8359375, 6.59765625, 8.359375, 10.12109375, 11.8828125, 13.64453125, 15.40625, 17.16796875, 18.9296875, 20.69140625, 22.453125, 24.21484375, 25.9765625, 27.73828125, 29.5, 31.26171875, 33.0234375, 34.78515625, 36.546875, 38.30859375, 40.0703125, 41.83203125, 43.59375, 45.35546875, 47.1171875, 48.87890625, 50.640625, 52.40234375, 54.1640625, 55.92578125, 57.6875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 37.0, 278.0, 505.0, 174.0, 14.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.3079833984375, -119.59233093261719, -114.8766860961914, -110.16104125976562, -105.44538879394531, -100.729736328125, -96.01409149169922, -91.29844665527344, -86.58279418945312, -81.86714172363281, -77.15149688720703, -72.43585205078125, -67.72019958496094, -63.00455093383789, -58.288902282714844, -53.5732536315918, -48.85760498046875, -44.1419563293457, -39.426307678222656, -34.71065902709961, -29.995010375976562, -25.279361724853516, -20.56371307373047, -15.848064422607422, -11.132415771484375, -6.416767120361328, -1.7011184692382812, 3.0145301818847656, 7.7301788330078125, 12.44582748413086, 17.161476135253906, 21.877124786376953, 26.592758178710938, 31.308406829833984, 36.02405548095703, 40.73970413208008, 45.455352783203125, 50.17100143432617, 54.88665008544922, 59.602298736572266, 64.31794738769531, 69.03359985351562, 73.7492446899414, 78.46488952636719, 83.1805419921875, 87.89619445800781, 92.6118392944336, 97.32748413085938, 102.04313659667969, 106.7587890625, 111.47443389892578, 116.19007873535156, 120.90573120117188, 125.62138366699219, 130.3370361328125, 135.05267333984375, 139.76832580566406, 144.48397827148438, 149.19961547851562, 153.91526794433594, 158.63092041015625, 163.34657287597656, 168.06222534179688, 172.77786254882812, 177.49351501464844]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 4.0, 6.0, 5.0, 6.0, 7.0, 19.0, 19.0, 13.0, 24.0, 26.0, 26.0, 28.0, 29.0, 47.0, 41.0, 51.0, 37.0, 42.0, 39.0, 57.0, 42.0, 42.0, 44.0, 46.0, 41.0, 24.0, 39.0, 29.0, 28.0, 20.0, 18.0, 9.0, 16.0, 12.0, 8.0, 16.0, 8.0, 10.0, 3.0, 5.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.028053283691406, -37.715789794921875, -36.403526306152344, -35.09126281738281, -33.77899932861328, -32.46673583984375, -31.154470443725586, -29.842205047607422, -28.52994155883789, -27.21767807006836, -25.905414581298828, -24.593151092529297, -23.280885696411133, -21.9686222076416, -20.65635871887207, -19.344093322753906, -18.031831741333008, -16.719568252563477, -15.407303810119629, -14.095040321350098, -12.78277587890625, -11.470512390136719, -10.158248901367188, -8.84598445892334, -7.533720970153809, -6.221457004547119, -4.90919303894043, -3.5969295501708984, -2.284665584564209, -0.9724016189575195, 0.3398618698120117, 1.6521263122558594, 2.9643898010253906, 4.27665376663208, 5.5889177322387695, 6.901181221008301, 8.213445663452148, 9.52570915222168, 10.837972640991211, 12.150237083435059, 13.46250057220459, 14.774764060974121, 16.08702850341797, 17.3992919921875, 18.71155548095703, 20.023818969726562, 21.336082458496094, 22.648347854614258, 23.96061134338379, 25.27287483215332, 26.58513832092285, 27.897403717041016, 29.209667205810547, 30.521930694580078, 31.83419418334961, 33.14645767211914, 34.45872116088867, 35.7709846496582, 37.083248138427734, 38.395511627197266, 39.7077751159668, 41.020042419433594, 42.332305908203125, 43.644569396972656, 44.95683288574219]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 0.0, 4.0, 6.0, 2.0, 3.0, 10.0, 4.0, 8.0, 9.0, 11.0, 8.0, 13.0, 17.0, 14.0, 15.0, 30.0, 29.0, 27.0, 33.0, 24.0, 43.0, 29.0, 30.0, 41.0, 33.0, 40.0, 48.0, 47.0, 43.0, 48.0, 39.0, 36.0, 34.0, 32.0, 35.0, 23.0, 24.0, 25.0, 10.0, 14.0, 10.0, 9.0, 6.0, 6.0, 4.0, 8.0, 2.0, 4.0, 3.0, 7.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.8359375, -3.70758056640625, -3.5792236328125, -3.45086669921875, -3.322509765625, -3.19415283203125, -3.0657958984375, -2.93743896484375, -2.80908203125, -2.68072509765625, -2.5523681640625, -2.42401123046875, -2.295654296875, -2.16729736328125, -2.0389404296875, -1.91058349609375, -1.7822265625, -1.65386962890625, -1.5255126953125, -1.39715576171875, -1.268798828125, -1.14044189453125, -1.0120849609375, -0.88372802734375, -0.75537109375, -0.62701416015625, -0.4986572265625, -0.37030029296875, -0.241943359375, -0.11358642578125, 0.0147705078125, 0.14312744140625, 0.271484375, 0.39984130859375, 0.5281982421875, 0.65655517578125, 0.784912109375, 0.91326904296875, 1.0416259765625, 1.16998291015625, 1.29833984375, 1.42669677734375, 1.5550537109375, 1.68341064453125, 1.811767578125, 1.94012451171875, 2.0684814453125, 2.19683837890625, 2.3251953125, 2.45355224609375, 2.5819091796875, 2.71026611328125, 2.838623046875, 2.96697998046875, 3.0953369140625, 3.22369384765625, 3.35205078125, 3.48040771484375, 3.6087646484375, 3.73712158203125, 3.865478515625, 3.99383544921875, 4.1221923828125, 4.25054931640625, 4.37890625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 17.0, 18.0, 12.0, 34.0, 47.0, 88.0, 114.0, 157.0, 199.0, 313.0, 403.0, 595.0, 883.0, 1269.0, 1951.0, 2957.0, 4450.0, 6854.0, 10989.0, 17409.0, 29387.0, 52234.0, 97966.0, 185731.0, 255804.0, 169070.0, 89091.0, 47916.0, 26940.0, 16506.0, 10110.0, 6404.0, 4039.0, 2824.0, 1875.0, 1231.0, 834.0, 591.0, 349.0, 259.0, 174.0, 136.0, 115.0, 73.0, 49.0, 30.0, 24.0, 15.0, 12.0, 11.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.58935546875, -0.5699844360351562, -0.5506134033203125, -0.5312423706054688, -0.511871337890625, -0.49250030517578125, -0.4731292724609375, -0.45375823974609375, -0.43438720703125, -0.41501617431640625, -0.3956451416015625, -0.37627410888671875, -0.356903076171875, -0.33753204345703125, -0.3181610107421875, -0.29878997802734375, -0.2794189453125, -0.26004791259765625, -0.2406768798828125, -0.22130584716796875, -0.201934814453125, -0.18256378173828125, -0.1631927490234375, -0.14382171630859375, -0.12445068359375, -0.10507965087890625, -0.0857086181640625, -0.06633758544921875, -0.046966552734375, -0.02759552001953125, -0.0082244873046875, 0.01114654541015625, 0.030517578125, 0.04988861083984375, 0.0692596435546875, 0.08863067626953125, 0.108001708984375, 0.12737274169921875, 0.1467437744140625, 0.16611480712890625, 0.18548583984375, 0.20485687255859375, 0.2242279052734375, 0.24359893798828125, 0.262969970703125, 0.28234100341796875, 0.3017120361328125, 0.32108306884765625, 0.3404541015625, 0.35982513427734375, 0.3791961669921875, 0.39856719970703125, 0.417938232421875, 0.43730926513671875, 0.4566802978515625, 0.47605133056640625, 0.49542236328125, 0.5147933959960938, 0.5341644287109375, 0.5535354614257812, 0.572906494140625, 0.5922775268554688, 0.6116485595703125, 0.6310195922851562, 0.650390625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 6.0, 10.0, 11.0, 14.0, 22.0, 18.0, 23.0, 29.0, 28.0, 35.0, 29.0, 33.0, 31.0, 31.0, 40.0, 35.0, 41.0, 40.0, 1072.0, 41.0, 34.0, 39.0, 31.0, 35.0, 31.0, 22.0, 26.0, 22.0, 27.0, 21.0, 16.0, 16.0, 13.0, 15.0, 10.0, 15.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.859375, -2.778076171875, -2.69677734375, -2.615478515625, -2.5341796875, -2.452880859375, -2.37158203125, -2.290283203125, -2.208984375, -2.127685546875, -2.04638671875, -1.965087890625, -1.8837890625, -1.802490234375, -1.72119140625, -1.639892578125, -1.55859375, -1.477294921875, -1.39599609375, -1.314697265625, -1.2333984375, -1.152099609375, -1.07080078125, -0.989501953125, -0.908203125, -0.826904296875, -0.74560546875, -0.664306640625, -0.5830078125, -0.501708984375, -0.42041015625, -0.339111328125, -0.2578125, -0.176513671875, -0.09521484375, -0.013916015625, 0.0673828125, 0.148681640625, 0.22998046875, 0.311279296875, 0.392578125, 0.473876953125, 0.55517578125, 0.636474609375, 0.7177734375, 0.799072265625, 0.88037109375, 0.961669921875, 1.04296875, 1.124267578125, 1.20556640625, 1.286865234375, 1.3681640625, 1.449462890625, 1.53076171875, 1.612060546875, 1.693359375, 1.774658203125, 1.85595703125, 1.937255859375, 2.0185546875, 2.099853515625, 2.18115234375, 2.262451171875, 2.34375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 6.0, 10.0, 21.0, 20.0, 37.0, 62.0, 90.0, 128.0, 225.0, 348.0, 599.0, 958.0, 1519.0, 2646.0, 4361.0, 7299.0, 12503.0, 21733.0, 37855.0, 69330.0, 127592.0, 230837.0, 1267561.0, 139119.0, 74551.0, 41511.0, 23384.0, 13296.0, 7764.0, 4641.0, 2717.0, 1701.0, 1027.0, 642.0, 345.0, 251.0, 162.0, 85.0, 73.0, 43.0, 28.0, 18.0, 9.0, 9.0, 11.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5283203125, -0.5113143920898438, -0.4943084716796875, -0.47730255126953125, -0.460296630859375, -0.44329071044921875, -0.4262847900390625, -0.40927886962890625, -0.39227294921875, -0.37526702880859375, -0.3582611083984375, -0.34125518798828125, -0.324249267578125, -0.30724334716796875, -0.2902374267578125, -0.27323150634765625, -0.2562255859375, -0.23921966552734375, -0.2222137451171875, -0.20520782470703125, -0.188201904296875, -0.17119598388671875, -0.1541900634765625, -0.13718414306640625, -0.12017822265625, -0.10317230224609375, -0.0861663818359375, -0.06916046142578125, -0.052154541015625, -0.03514862060546875, -0.0181427001953125, -0.00113677978515625, 0.015869140625, 0.03287506103515625, 0.0498809814453125, 0.06688690185546875, 0.083892822265625, 0.10089874267578125, 0.1179046630859375, 0.13491058349609375, 0.15191650390625, 0.16892242431640625, 0.1859283447265625, 0.20293426513671875, 0.219940185546875, 0.23694610595703125, 0.2539520263671875, 0.27095794677734375, 0.2879638671875, 0.30496978759765625, 0.3219757080078125, 0.33898162841796875, 0.355987548828125, 0.37299346923828125, 0.3899993896484375, 0.40700531005859375, 0.42401123046875, 0.44101715087890625, 0.4580230712890625, 0.47502899169921875, 0.492034912109375, 0.5090408325195312, 0.5260467529296875, 0.5430526733398438, 0.56005859375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 9.0, 4.0, 8.0, 12.0, 15.0, 24.0, 20.0, 43.0, 37.0, 63.0, 54.0, 68.0, 66.0, 85.0, 77.0, 85.0, 67.0, 51.0, 40.0, 41.0, 36.0, 28.0, 10.0, 10.0, 12.0, 5.0, 6.0, 6.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015535354614257812, -0.00149555504322052, -0.0014375746250152588, -0.0013795942068099976, -0.0013216137886047363, -0.001263633370399475, -0.0012056529521942139, -0.0011476725339889526, -0.0010896921157836914, -0.0010317116975784302, -0.0009737312793731689, -0.0009157508611679077, -0.0008577704429626465, -0.0007997900247573853, -0.000741809606552124, -0.0006838291883468628, -0.0006258487701416016, -0.0005678683519363403, -0.0005098879337310791, -0.00045190751552581787, -0.00039392709732055664, -0.0003359466791152954, -0.0002779662609100342, -0.00021998584270477295, -0.00016200542449951172, -0.00010402500629425049, -4.604458808898926e-05, 1.1935830116271973e-05, 6.99162483215332e-05, 0.00012789666652679443, 0.00018587708473205566, 0.0002438575029373169, 0.0003018379211425781, 0.00035981833934783936, 0.0004177987575531006, 0.0004757791757583618, 0.000533759593963623, 0.0005917400121688843, 0.0006497204303741455, 0.0007077008485794067, 0.000765681266784668, 0.0008236616849899292, 0.0008816421031951904, 0.0009396225214004517, 0.0009976029396057129, 0.0010555833578109741, 0.0011135637760162354, 0.0011715441942214966, 0.0012295246124267578, 0.001287505030632019, 0.0013454854488372803, 0.0014034658670425415, 0.0014614462852478027, 0.001519426703453064, 0.0015774071216583252, 0.0016353875398635864, 0.0016933679580688477, 0.0017513483762741089, 0.0018093287944793701, 0.0018673092126846313, 0.0019252896308898926, 0.001983270049095154, 0.002041250467300415, 0.0020992308855056763, 0.0021572113037109375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 9.0, 8.0, 6.0, 18.0, 18.0, 25.0, 36.0, 39.0, 45.0, 76.0, 88.0, 129.0, 190.0, 321.0, 483.0, 950.0, 8580.0, 1032903.0, 2423.0, 791.0, 427.0, 288.0, 175.0, 132.0, 90.0, 67.0, 65.0, 35.0, 26.0, 26.0, 15.0, 18.0, 6.0, 6.0, 8.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03228759765625, -0.031258583068847656, -0.030229568481445312, -0.02920055389404297, -0.028171539306640625, -0.02714252471923828, -0.026113510131835938, -0.025084495544433594, -0.02405548095703125, -0.023026466369628906, -0.021997451782226562, -0.02096843719482422, -0.019939422607421875, -0.01891040802001953, -0.017881393432617188, -0.016852378845214844, -0.0158233642578125, -0.014794349670410156, -0.013765335083007812, -0.012736320495605469, -0.011707305908203125, -0.010678291320800781, -0.009649276733398438, -0.008620262145996094, -0.00759124755859375, -0.006562232971191406, -0.0055332183837890625, -0.004504203796386719, -0.003475189208984375, -0.0024461746215820312, -0.0014171600341796875, -0.00038814544677734375, 0.000640869140625, 0.0016698837280273438, 0.0026988983154296875, 0.0037279129028320312, 0.004756927490234375, 0.005785942077636719, 0.0068149566650390625, 0.007843971252441406, 0.00887298583984375, 0.009902000427246094, 0.010931015014648438, 0.011960029602050781, 0.012989044189453125, 0.014018058776855469, 0.015047073364257812, 0.016076087951660156, 0.0171051025390625, 0.018134117126464844, 0.019163131713867188, 0.02019214630126953, 0.021221160888671875, 0.02225017547607422, 0.023279190063476562, 0.024308204650878906, 0.02533721923828125, 0.026366233825683594, 0.027395248413085938, 0.02842426300048828, 0.029453277587890625, 0.03048229217529297, 0.03151130676269531, 0.032540321350097656, 0.0335693359375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 861.0, 139.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003612068947404623, -0.0033659166656434536, -0.003119764616712928, -0.002873612567782402, -0.0026274602860212326, -0.002381308004260063, -0.0021351559553295374, -0.0018890037899836898, -0.0016428516246378422, -0.0013966994592919946, -0.001150547293946147, -0.0009043951286002994, -0.0006582429632544518, -0.00041209079790860415, -0.00016593863256275654, 8.021353278309107e-05, 0.0003263656981289387, 0.0005725178634747863, 0.0008186700288206339, 0.0010648221941664815, 0.001310974359512329, 0.0015571265248581767, 0.0018032786902040243, 0.00204943073913455, 0.0022955830208957195, 0.002541735302656889, 0.0027878873515874147, 0.0030340394005179405, 0.00328019168227911, 0.0035263439640402794, 0.003772496012970805, 0.004018648061901331, 0.004264800809323788, 0.004510953091084957, 0.0047571053728461266, 0.005003257188946009, 0.005249409470707178, 0.0054955617524683475, 0.00574171356856823, 0.005987865850329399, 0.0062340181320905685, 0.006480170413851738, 0.006726322695612907, 0.0069724745117127895, 0.007218626793473959, 0.007464779075235128, 0.0077109308913350105, 0.00795708317309618, 0.00820323545485735, 0.008449387736618519, 0.008695540018379688, 0.008941692300140858, 0.009187843650579453, 0.009433995932340622, 0.009680148214101791, 0.00992630049586296, 0.01017245277762413, 0.0104186050593853, 0.010664757341146469, 0.010910909622907639, 0.011157061904668808, 0.011403213255107403, 0.011649365536868572, 0.011895517818629742, 0.012141670100390911]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 9.0, 4.0, 8.0, 2.0, 7.0, 10.0, 6.0, 14.0, 24.0, 21.0, 21.0, 27.0, 23.0, 37.0, 32.0, 42.0, 39.0, 40.0, 44.0, 42.0, 45.0, 39.0, 41.0, 43.0, 40.0, 36.0, 27.0, 36.0, 36.0, 30.0, 25.0, 26.0, 27.0, 21.0, 15.0, 14.0, 10.0, 8.0, 6.0, 11.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008364319801330566, -0.0008103298023343086, -0.0007842276245355606, -0.0007581254467368126, -0.0007320232689380646, -0.0007059210911393166, -0.0006798189133405685, -0.0006537167355418205, -0.0006276145577430725, -0.0006015123799443245, -0.0005754102021455765, -0.0005493080243468285, -0.0005232058465480804, -0.0004971036687493324, -0.0004710014909505844, -0.0004448993131518364, -0.0004187971353530884, -0.00039269495755434036, -0.00036659277975559235, -0.00034049060195684433, -0.0003143884241580963, -0.0002882862463593483, -0.0002621840685606003, -0.00023608189076185226, -0.00020997971296310425, -0.00018387753516435623, -0.00015777535736560822, -0.0001316731795668602, -0.00010557100176811218, -7.946882396936417e-05, -5.336664617061615e-05, -2.7264468371868134e-05, -1.1622905731201172e-06, 2.49398872256279e-05, 5.1042065024375916e-05, 7.714424282312393e-05, 0.00010324642062187195, 0.00012934859842061996, 0.00015545077621936798, 0.000181552954018116, 0.00020765513181686401, 0.00023375730961561203, 0.00025985948741436005, 0.00028596166521310806, 0.0003120638430118561, 0.0003381660208106041, 0.0003642681986093521, 0.00039037037640810013, 0.00041647255420684814, 0.00044257473200559616, 0.0004686769098043442, 0.0004947790876030922, 0.0005208812654018402, 0.0005469834432005882, 0.0005730856209993362, 0.0005991877987980843, 0.0006252899765968323, 0.0006513921543955803, 0.0006774943321943283, 0.0007035965099930763, 0.0007296986877918243, 0.0007558008655905724, 0.0007819030433893204, 0.0008080052211880684, 0.0008341073989868164]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 0.0, 4.0, 6.0, 2.0, 3.0, 10.0, 4.0, 8.0, 9.0, 11.0, 8.0, 13.0, 17.0, 14.0, 15.0, 30.0, 29.0, 27.0, 33.0, 24.0, 43.0, 29.0, 31.0, 40.0, 33.0, 40.0, 48.0, 47.0, 43.0, 48.0, 40.0, 35.0, 34.0, 33.0, 34.0, 23.0, 24.0, 25.0, 10.0, 14.0, 10.0, 9.0, 6.0, 6.0, 4.0, 8.0, 2.0, 4.0, 3.0, 7.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.8359375, -3.70758056640625, -3.5792236328125, -3.45086669921875, -3.322509765625, -3.19415283203125, -3.0657958984375, -2.93743896484375, -2.80908203125, -2.68072509765625, -2.5523681640625, -2.42401123046875, -2.295654296875, -2.16729736328125, -2.0389404296875, -1.91058349609375, -1.7822265625, -1.65386962890625, -1.5255126953125, -1.39715576171875, -1.268798828125, -1.14044189453125, -1.0120849609375, -0.88372802734375, -0.75537109375, -0.62701416015625, -0.4986572265625, -0.37030029296875, -0.241943359375, -0.11358642578125, 0.0147705078125, 0.14312744140625, 0.271484375, 0.39984130859375, 0.5281982421875, 0.65655517578125, 0.784912109375, 0.91326904296875, 1.0416259765625, 1.16998291015625, 1.29833984375, 1.42669677734375, 1.5550537109375, 1.68341064453125, 1.811767578125, 1.94012451171875, 2.0684814453125, 2.19683837890625, 2.3251953125, 2.45355224609375, 2.5819091796875, 2.71026611328125, 2.838623046875, 2.96697998046875, 3.0953369140625, 3.22369384765625, 3.35205078125, 3.48040771484375, 3.6087646484375, 3.73712158203125, 3.865478515625, 3.99383544921875, 4.1221923828125, 4.25054931640625, 4.37890625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 9.0, 15.0, 11.0, 12.0, 21.0, 25.0, 25.0, 42.0, 44.0, 58.0, 101.0, 102.0, 179.0, 222.0, 306.0, 427.0, 703.0, 1200.0, 2338.0, 5273.0, 14022.0, 53856.0, 323901.0, 524177.0, 87237.0, 20479.0, 6793.0, 2878.0, 1470.0, 836.0, 494.0, 361.0, 246.0, 181.0, 123.0, 101.0, 67.0, 47.0, 34.0, 28.0, 21.0, 15.0, 11.0, 9.0, 8.0, 7.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-6.90625, -6.67718505859375, -6.4481201171875, -6.21905517578125, -5.989990234375, -5.76092529296875, -5.5318603515625, -5.30279541015625, -5.07373046875, -4.84466552734375, -4.6156005859375, -4.38653564453125, -4.157470703125, -3.92840576171875, -3.6993408203125, -3.47027587890625, -3.2412109375, -3.01214599609375, -2.7830810546875, -2.55401611328125, -2.324951171875, -2.09588623046875, -1.8668212890625, -1.63775634765625, -1.40869140625, -1.17962646484375, -0.9505615234375, -0.72149658203125, -0.492431640625, -0.26336669921875, -0.0343017578125, 0.19476318359375, 0.423828125, 0.65289306640625, 0.8819580078125, 1.11102294921875, 1.340087890625, 1.56915283203125, 1.7982177734375, 2.02728271484375, 2.25634765625, 2.48541259765625, 2.7144775390625, 2.94354248046875, 3.172607421875, 3.40167236328125, 3.6307373046875, 3.85980224609375, 4.0888671875, 4.31793212890625, 4.5469970703125, 4.77606201171875, 5.005126953125, 5.23419189453125, 5.4632568359375, 5.69232177734375, 5.92138671875, 6.15045166015625, 6.3795166015625, 6.60858154296875, 6.837646484375, 7.06671142578125, 7.2957763671875, 7.52484130859375, 7.75390625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 11.0, 8.0, 9.0, 15.0, 19.0, 16.0, 17.0, 26.0, 27.0, 44.0, 51.0, 49.0, 85.0, 116.0, 448.0, 1597.0, 111.0, 73.0, 48.0, 47.0, 38.0, 45.0, 23.0, 23.0, 29.0, 14.0, 10.0, 4.0, 9.0, 5.0, 9.0, 6.0, 2.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.40625, -9.991455078125, -9.57666015625, -9.161865234375, -8.7470703125, -8.332275390625, -7.91748046875, -7.502685546875, -7.087890625, -6.673095703125, -6.25830078125, -5.843505859375, -5.4287109375, -5.013916015625, -4.59912109375, -4.184326171875, -3.76953125, -3.354736328125, -2.93994140625, -2.525146484375, -2.1103515625, -1.695556640625, -1.28076171875, -0.865966796875, -0.451171875, -0.036376953125, 0.37841796875, 0.793212890625, 1.2080078125, 1.622802734375, 2.03759765625, 2.452392578125, 2.8671875, 3.281982421875, 3.69677734375, 4.111572265625, 4.5263671875, 4.941162109375, 5.35595703125, 5.770751953125, 6.185546875, 6.600341796875, 7.01513671875, 7.429931640625, 7.8447265625, 8.259521484375, 8.67431640625, 9.089111328125, 9.50390625, 9.918701171875, 10.33349609375, 10.748291015625, 11.1630859375, 11.577880859375, 11.99267578125, 12.407470703125, 12.822265625, 13.237060546875, 13.65185546875, 14.066650390625, 14.4814453125, 14.896240234375, 15.31103515625, 15.725830078125, 16.140625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 8.0, 9.0, 3.0, 9.0, 11.0, 7.0, 20.0, 21.0, 31.0, 56.0, 87.0, 129.0, 226.0, 455.0, 1288.0, 416160.0, 2724655.0, 1413.0, 469.0, 274.0, 119.0, 85.0, 55.0, 25.0, 24.0, 18.0, 14.0, 8.0, 4.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-47.71875, -46.46435546875, -45.2099609375, -43.95556640625, -42.701171875, -41.44677734375, -40.1923828125, -38.93798828125, -37.68359375, -36.42919921875, -35.1748046875, -33.92041015625, -32.666015625, -31.41162109375, -30.1572265625, -28.90283203125, -27.6484375, -26.39404296875, -25.1396484375, -23.88525390625, -22.630859375, -21.37646484375, -20.1220703125, -18.86767578125, -17.61328125, -16.35888671875, -15.1044921875, -13.85009765625, -12.595703125, -11.34130859375, -10.0869140625, -8.83251953125, -7.578125, -6.32373046875, -5.0693359375, -3.81494140625, -2.560546875, -1.30615234375, -0.0517578125, 1.20263671875, 2.45703125, 3.71142578125, 4.9658203125, 6.22021484375, 7.474609375, 8.72900390625, 9.9833984375, 11.23779296875, 12.4921875, 13.74658203125, 15.0009765625, 16.25537109375, 17.509765625, 18.76416015625, 20.0185546875, 21.27294921875, 22.52734375, 23.78173828125, 25.0361328125, 26.29052734375, 27.544921875, 28.79931640625, 30.0537109375, 31.30810546875, 32.5625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [4.0, 9.0, 19.0, 78.0, 153.0, 246.0, 259.0, 139.0, 70.0, 23.0, 8.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.243184566497803, -3.504897117614746, -2.7666096687316895, -2.028322458267212, -1.2900350093841553, -0.5517475605010986, 0.1865396499633789, 0.9248270988464355, 1.6631145477294922, 2.401401996612549, 3.1396894454956055, 3.877976655960083, 4.616264343261719, 5.354551315307617, 6.092838764190674, 6.8311262130737305, 7.569413661956787, 8.307701110839844, 9.045988082885742, 9.784276008605957, 10.522562980651855, 11.26085090637207, 11.999137878417969, 12.737424850463867, 13.475712776184082, 14.21399974822998, 14.952287673950195, 15.690574645996094, 16.428861618041992, 17.167150497436523, 17.905437469482422, 18.64372444152832, 19.38201332092285, 20.12030029296875, 20.85858726501465, 21.59687614440918, 22.335163116455078, 23.073450088500977, 23.811737060546875, 24.550025939941406, 25.288312911987305, 26.026599884033203, 26.7648868560791, 27.503175735473633, 28.24146270751953, 28.97974967956543, 29.718036651611328, 30.45632553100586, 31.194610595703125, 31.932897567749023, 32.67118453979492, 33.40947341918945, 34.14775848388672, 34.88604736328125, 35.62433624267578, 36.36262130737305, 37.10091018676758, 37.83919906616211, 38.577484130859375, 39.315773010253906, 40.05405807495117, 40.7923469543457, 41.530635833740234, 42.2689208984375, 43.00720977783203]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 2.0, 4.0, 2.0, 6.0, 6.0, 9.0, 6.0, 3.0, 13.0, 11.0, 8.0, 14.0, 21.0, 15.0, 22.0, 23.0, 26.0, 33.0, 30.0, 30.0, 40.0, 43.0, 46.0, 40.0, 33.0, 43.0, 31.0, 40.0, 30.0, 35.0, 30.0, 46.0, 27.0, 25.0, 21.0, 28.0, 20.0, 16.0, 26.0, 22.0, 13.0, 14.0, 11.0, 11.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-23.05164337158203, -22.2810001373291, -21.510358810424805, -20.739715576171875, -19.969074249267578, -19.19843101501465, -18.42778778076172, -17.657146453857422, -16.886503219604492, -16.115859985351562, -15.345218658447266, -14.574575424194336, -13.803933143615723, -13.03329086303711, -12.26264762878418, -11.492005348205566, -10.721363067626953, -9.95072078704834, -9.180078506469727, -8.409435272216797, -7.638792991638184, -6.86815071105957, -6.097507953643799, -5.326865196228027, -4.556222915649414, -3.7855803966522217, -3.0149378776550293, -2.244295358657837, -1.4736528396606445, -0.7030103206634521, 0.06763219833374023, 0.8382749557495117, 1.608917236328125, 2.3795597553253174, 3.1502022743225098, 3.920844793319702, 4.6914873123168945, 5.462129592895508, 6.232772350311279, 7.003415107727051, 7.774057388305664, 8.544699668884277, 9.31534194946289, 10.08598518371582, 10.856627464294434, 11.627269744873047, 12.397912979125977, 13.16855525970459, 13.939197540283203, 14.709839820861816, 15.48048210144043, 16.25112533569336, 17.021766662597656, 17.792409896850586, 18.563053131103516, 19.333694458007812, 20.104337692260742, 20.874980926513672, 21.64562225341797, 22.4162654876709, 23.186908721923828, 23.957550048828125, 24.728193283081055, 25.498836517333984, 26.26947784423828]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 7.0, 5.0, 10.0, 7.0, 10.0, 8.0, 17.0, 27.0, 19.0, 22.0, 27.0, 32.0, 33.0, 37.0, 33.0, 34.0, 60.0, 37.0, 38.0, 61.0, 49.0, 51.0, 45.0, 42.0, 35.0, 36.0, 42.0, 28.0, 21.0, 26.0, 16.0, 13.0, 10.0, 14.0, 13.0, 4.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.30859375, -5.1435546875, -4.978515625, -4.8134765625, -4.6484375, -4.4833984375, -4.318359375, -4.1533203125, -3.98828125, -3.8232421875, -3.658203125, -3.4931640625, -3.328125, -3.1630859375, -2.998046875, -2.8330078125, -2.66796875, -2.5029296875, -2.337890625, -2.1728515625, -2.0078125, -1.8427734375, -1.677734375, -1.5126953125, -1.34765625, -1.1826171875, -1.017578125, -0.8525390625, -0.6875, -0.5224609375, -0.357421875, -0.1923828125, -0.02734375, 0.1376953125, 0.302734375, 0.4677734375, 0.6328125, 0.7978515625, 0.962890625, 1.1279296875, 1.29296875, 1.4580078125, 1.623046875, 1.7880859375, 1.953125, 2.1181640625, 2.283203125, 2.4482421875, 2.61328125, 2.7783203125, 2.943359375, 3.1083984375, 3.2734375, 3.4384765625, 3.603515625, 3.7685546875, 3.93359375, 4.0986328125, 4.263671875, 4.4287109375, 4.59375, 4.7587890625, 4.923828125, 5.0888671875, 5.25390625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 6.0, 9.0, 8.0, 17.0, 20.0, 26.0, 44.0, 32.0, 53.0, 76.0, 90.0, 107.0, 135.0, 210.0, 256.0, 385.0, 618.0, 1189.0, 3628.0, 46896.0, 3683444.0, 445041.0, 7740.0, 1744.0, 771.0, 491.0, 302.0, 207.0, 147.0, 145.0, 95.0, 79.0, 55.0, 35.0, 39.0, 30.0, 16.0, 23.0, 21.0, 9.0, 10.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.40625, -30.446044921875, -29.48583984375, -28.525634765625, -27.5654296875, -26.605224609375, -25.64501953125, -24.684814453125, -23.724609375, -22.764404296875, -21.80419921875, -20.843994140625, -19.8837890625, -18.923583984375, -17.96337890625, -17.003173828125, -16.04296875, -15.082763671875, -14.12255859375, -13.162353515625, -12.2021484375, -11.241943359375, -10.28173828125, -9.321533203125, -8.361328125, -7.401123046875, -6.44091796875, -5.480712890625, -4.5205078125, -3.560302734375, -2.60009765625, -1.639892578125, -0.6796875, 0.280517578125, 1.24072265625, 2.200927734375, 3.1611328125, 4.121337890625, 5.08154296875, 6.041748046875, 7.001953125, 7.962158203125, 8.92236328125, 9.882568359375, 10.8427734375, 11.802978515625, 12.76318359375, 13.723388671875, 14.68359375, 15.643798828125, 16.60400390625, 17.564208984375, 18.5244140625, 19.484619140625, 20.44482421875, 21.405029296875, 22.365234375, 23.325439453125, 24.28564453125, 25.245849609375, 26.2060546875, 27.166259765625, 28.12646484375, 29.086669921875, 30.046875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 7.0, 14.0, 13.0, 27.0, 35.0, 43.0, 58.0, 112.0, 170.0, 245.0, 378.0, 514.0, 592.0, 523.0, 431.0, 279.0, 195.0, 144.0, 77.0, 57.0, 40.0, 31.0, 17.0, 15.0, 9.0, 8.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.3671875, -9.0804443359375, -8.793701171875, -8.5069580078125, -8.22021484375, -7.9334716796875, -7.646728515625, -7.3599853515625, -7.0732421875, -6.7864990234375, -6.499755859375, -6.2130126953125, -5.92626953125, -5.6395263671875, -5.352783203125, -5.0660400390625, -4.779296875, -4.4925537109375, -4.205810546875, -3.9190673828125, -3.63232421875, -3.3455810546875, -3.058837890625, -2.7720947265625, -2.4853515625, -2.1986083984375, -1.911865234375, -1.6251220703125, -1.33837890625, -1.0516357421875, -0.764892578125, -0.4781494140625, -0.19140625, 0.0953369140625, 0.382080078125, 0.6688232421875, 0.95556640625, 1.2423095703125, 1.529052734375, 1.8157958984375, 2.1025390625, 2.3892822265625, 2.676025390625, 2.9627685546875, 3.24951171875, 3.5362548828125, 3.822998046875, 4.1097412109375, 4.396484375, 4.6832275390625, 4.969970703125, 5.2567138671875, 5.54345703125, 5.8302001953125, 6.116943359375, 6.4036865234375, 6.6904296875, 6.9771728515625, 7.263916015625, 7.5506591796875, 7.83740234375, 8.1241455078125, 8.410888671875, 8.6976318359375, 8.984375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 23.0, 12.0, 36.0, 52.0, 106.0, 274.0, 777.0, 2414.0, 11196.0, 105131.0, 2777698.0, 1233180.0, 53430.0, 7227.0, 1681.0, 582.0, 212.0, 103.0, 56.0, 24.0, 17.0, 10.0, 10.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0625, -10.61767578125, -10.1728515625, -9.72802734375, -9.283203125, -8.83837890625, -8.3935546875, -7.94873046875, -7.50390625, -7.05908203125, -6.6142578125, -6.16943359375, -5.724609375, -5.27978515625, -4.8349609375, -4.39013671875, -3.9453125, -3.50048828125, -3.0556640625, -2.61083984375, -2.166015625, -1.72119140625, -1.2763671875, -0.83154296875, -0.38671875, 0.05810546875, 0.5029296875, 0.94775390625, 1.392578125, 1.83740234375, 2.2822265625, 2.72705078125, 3.171875, 3.61669921875, 4.0615234375, 4.50634765625, 4.951171875, 5.39599609375, 5.8408203125, 6.28564453125, 6.73046875, 7.17529296875, 7.6201171875, 8.06494140625, 8.509765625, 8.95458984375, 9.3994140625, 9.84423828125, 10.2890625, 10.73388671875, 11.1787109375, 11.62353515625, 12.068359375, 12.51318359375, 12.9580078125, 13.40283203125, 13.84765625, 14.29248046875, 14.7373046875, 15.18212890625, 15.626953125, 16.07177734375, 16.5166015625, 16.96142578125, 17.40625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 9.0, 11.0, 20.0, 38.0, 80.0, 93.0, 148.0, 170.0, 134.0, 132.0, 74.0, 45.0, 19.0, 10.0, 8.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.44524383544922, -54.77109909057617, -52.096954345703125, -49.422813415527344, -46.7486686706543, -44.07452392578125, -41.4003791809082, -38.726234436035156, -36.052093505859375, -33.37794876098633, -30.703805923461914, -28.029661178588867, -25.355518341064453, -22.681373596191406, -20.00722885131836, -17.333086013793945, -14.658939361572266, -11.984795570373535, -9.310651779174805, -6.636507034301758, -3.9623632431030273, -1.2882194519042969, 1.38592529296875, 4.060068130493164, 6.734212875366211, 9.408356666564941, 12.082500457763672, 14.756645202636719, 17.430789947509766, 20.10493278503418, 22.779077529907227, 25.45322036743164, 28.127365112304688, 30.801509857177734, 33.47565460205078, 36.14979553222656, 38.82394027709961, 41.498085021972656, 44.1722297668457, 46.84637451171875, 49.52051544189453, 52.19466018676758, 54.868804931640625, 57.542945861816406, 60.21709060668945, 62.8912353515625, 65.56538391113281, 68.2395248413086, 70.91366577148438, 73.58780670166016, 76.26195526123047, 78.93609619140625, 81.61024475097656, 84.28438568115234, 86.95852661132812, 89.63267517089844, 92.30682373046875, 94.98096466064453, 97.65511322021484, 100.32925415039062, 103.00340270996094, 105.67754364013672, 108.3516845703125, 111.02583312988281, 113.6999740600586]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 6.0, 8.0, 8.0, 9.0, 15.0, 11.0, 17.0, 23.0, 24.0, 27.0, 28.0, 25.0, 29.0, 24.0, 42.0, 36.0, 38.0, 52.0, 37.0, 26.0, 48.0, 47.0, 30.0, 29.0, 41.0, 38.0, 32.0, 36.0, 35.0, 20.0, 19.0, 21.0, 18.0, 11.0, 18.0, 13.0, 7.0, 13.0, 8.0, 9.0, 4.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.084197998046875, -26.1844482421875, -25.284700393676758, -24.384950637817383, -23.48520278930664, -22.585453033447266, -21.68570327758789, -20.785953521728516, -19.886205673217773, -18.9864559173584, -18.086708068847656, -17.18695831298828, -16.287208557128906, -15.387460708618164, -14.487710952758789, -13.58796215057373, -12.688213348388672, -11.788464546203613, -10.888715744018555, -9.98896598815918, -9.089217185974121, -8.189468383789062, -7.289719104766846, -6.389969825744629, -5.49022102355957, -4.590472221374512, -3.690722942352295, -2.7909739017486572, -1.8912248611450195, -0.9914760589599609, -0.09172677993774414, 0.8080224990844727, 1.7077693939208984, 2.607518434524536, 3.507267475128174, 4.407016754150391, 5.306765556335449, 6.206514358520508, 7.106263637542725, 8.006012916564941, 8.90576171875, 9.805510520935059, 10.705259323120117, 11.605009078979492, 12.50475788116455, 13.40450668334961, 14.304256439208984, 15.204005241394043, 16.1037540435791, 17.003503799438477, 17.90325164794922, 18.803001403808594, 19.70275115966797, 20.60249900817871, 21.502248764038086, 22.401996612548828, 23.301746368408203, 24.201496124267578, 25.10124397277832, 26.000993728637695, 26.900741577148438, 27.800491333007812, 28.700241088867188, 29.599990844726562, 30.499738693237305]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 10.0, 9.0, 15.0, 11.0, 20.0, 18.0, 16.0, 22.0, 32.0, 20.0, 24.0, 29.0, 30.0, 31.0, 34.0, 43.0, 42.0, 35.0, 47.0, 33.0, 37.0, 31.0, 39.0, 40.0, 33.0, 30.0, 25.0, 31.0, 25.0, 26.0, 17.0, 15.0, 24.0, 14.0, 10.0, 8.0, 12.0, 6.0, 11.0, 10.0, 4.0, 4.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-42.59375, -41.2333984375, -39.873046875, -38.5126953125, -37.15234375, -35.7919921875, -34.431640625, -33.0712890625, -31.7109375, -30.3505859375, -28.990234375, -27.6298828125, -26.26953125, -24.9091796875, -23.548828125, -22.1884765625, -20.828125, -19.4677734375, -18.107421875, -16.7470703125, -15.38671875, -14.0263671875, -12.666015625, -11.3056640625, -9.9453125, -8.5849609375, -7.224609375, -5.8642578125, -4.50390625, -3.1435546875, -1.783203125, -0.4228515625, 0.9375, 2.2978515625, 3.658203125, 5.0185546875, 6.37890625, 7.7392578125, 9.099609375, 10.4599609375, 11.8203125, 13.1806640625, 14.541015625, 15.9013671875, 17.26171875, 18.6220703125, 19.982421875, 21.3427734375, 22.703125, 24.0634765625, 25.423828125, 26.7841796875, 28.14453125, 29.5048828125, 30.865234375, 32.2255859375, 33.5859375, 34.9462890625, 36.306640625, 37.6669921875, 39.02734375, 40.3876953125, 41.748046875, 43.1083984375, 44.46875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 12.0, 3.0, 15.0, 14.0, 21.0, 36.0, 46.0, 66.0, 92.0, 137.0, 163.0, 270.0, 365.0, 564.0, 745.0, 1106.0, 1590.0, 2315.0, 3508.0, 5365.0, 8277.0, 12489.0, 20248.0, 31952.0, 51580.0, 81918.0, 126912.0, 174760.0, 174876.0, 126072.0, 82268.0, 51296.0, 32045.0, 19996.0, 12728.0, 8158.0, 5377.0, 3475.0, 2378.0, 1586.0, 1075.0, 785.0, 574.0, 367.0, 270.0, 197.0, 136.0, 100.0, 61.0, 59.0, 30.0, 24.0, 19.0, 18.0, 3.0, 9.0, 4.0, 4.0, 4.0, 2.0], "bins": [-4.2265625, -4.094482421875, -3.96240234375, -3.830322265625, -3.6982421875, -3.566162109375, -3.43408203125, -3.302001953125, -3.169921875, -3.037841796875, -2.90576171875, -2.773681640625, -2.6416015625, -2.509521484375, -2.37744140625, -2.245361328125, -2.11328125, -1.981201171875, -1.84912109375, -1.717041015625, -1.5849609375, -1.452880859375, -1.32080078125, -1.188720703125, -1.056640625, -0.924560546875, -0.79248046875, -0.660400390625, -0.5283203125, -0.396240234375, -0.26416015625, -0.132080078125, 0.0, 0.132080078125, 0.26416015625, 0.396240234375, 0.5283203125, 0.660400390625, 0.79248046875, 0.924560546875, 1.056640625, 1.188720703125, 1.32080078125, 1.452880859375, 1.5849609375, 1.717041015625, 1.84912109375, 1.981201171875, 2.11328125, 2.245361328125, 2.37744140625, 2.509521484375, 2.6416015625, 2.773681640625, 2.90576171875, 3.037841796875, 3.169921875, 3.302001953125, 3.43408203125, 3.566162109375, 3.6982421875, 3.830322265625, 3.96240234375, 4.094482421875, 4.2265625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 1.0, 2.0, 5.0, 4.0, 11.0, 7.0, 8.0, 14.0, 12.0, 21.0, 18.0, 27.0, 32.0, 31.0, 37.0, 37.0, 36.0, 39.0, 41.0, 51.0, 42.0, 1067.0, 41.0, 47.0, 49.0, 35.0, 48.0, 32.0, 38.0, 37.0, 23.0, 18.0, 26.0, 17.0, 19.0, 11.0, 11.0, 8.0, 7.0, 7.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.8125, -23.7919921875, -22.771484375, -21.7509765625, -20.73046875, -19.7099609375, -18.689453125, -17.6689453125, -16.6484375, -15.6279296875, -14.607421875, -13.5869140625, -12.56640625, -11.5458984375, -10.525390625, -9.5048828125, -8.484375, -7.4638671875, -6.443359375, -5.4228515625, -4.40234375, -3.3818359375, -2.361328125, -1.3408203125, -0.3203125, 0.7001953125, 1.720703125, 2.7412109375, 3.76171875, 4.7822265625, 5.802734375, 6.8232421875, 7.84375, 8.8642578125, 9.884765625, 10.9052734375, 11.92578125, 12.9462890625, 13.966796875, 14.9873046875, 16.0078125, 17.0283203125, 18.048828125, 19.0693359375, 20.08984375, 21.1103515625, 22.130859375, 23.1513671875, 24.171875, 25.1923828125, 26.212890625, 27.2333984375, 28.25390625, 29.2744140625, 30.294921875, 31.3154296875, 32.3359375, 33.3564453125, 34.376953125, 35.3974609375, 36.41796875, 37.4384765625, 38.458984375, 39.4794921875, 40.5]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 12.0, 13.0, 28.0, 23.0, 43.0, 66.0, 103.0, 143.0, 219.0, 323.0, 557.0, 878.0, 1367.0, 2179.0, 3615.0, 6280.0, 10174.0, 18275.0, 32544.0, 60119.0, 111510.0, 191309.0, 1279580.0, 167332.0, 93223.0, 50677.0, 27796.0, 15730.0, 9076.0, 5335.0, 3170.0, 2030.0, 1201.0, 823.0, 487.0, 290.0, 200.0, 133.0, 89.0, 58.0, 39.0, 32.0, 15.0, 14.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.7578125, -5.585205078125, -5.41259765625, -5.239990234375, -5.0673828125, -4.894775390625, -4.72216796875, -4.549560546875, -4.376953125, -4.204345703125, -4.03173828125, -3.859130859375, -3.6865234375, -3.513916015625, -3.34130859375, -3.168701171875, -2.99609375, -2.823486328125, -2.65087890625, -2.478271484375, -2.3056640625, -2.133056640625, -1.96044921875, -1.787841796875, -1.615234375, -1.442626953125, -1.27001953125, -1.097412109375, -0.9248046875, -0.752197265625, -0.57958984375, -0.406982421875, -0.234375, -0.061767578125, 0.11083984375, 0.283447265625, 0.4560546875, 0.628662109375, 0.80126953125, 0.973876953125, 1.146484375, 1.319091796875, 1.49169921875, 1.664306640625, 1.8369140625, 2.009521484375, 2.18212890625, 2.354736328125, 2.52734375, 2.699951171875, 2.87255859375, 3.045166015625, 3.2177734375, 3.390380859375, 3.56298828125, 3.735595703125, 3.908203125, 4.080810546875, 4.25341796875, 4.426025390625, 4.5986328125, 4.771240234375, 4.94384765625, 5.116455078125, 5.2890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 5.0, 8.0, 5.0, 10.0, 3.0, 8.0, 11.0, 12.0, 7.0, 22.0, 15.0, 24.0, 24.0, 43.0, 37.0, 61.0, 74.0, 93.0, 79.0, 76.0, 66.0, 52.0, 44.0, 41.0, 36.0, 27.0, 15.0, 18.0, 10.0, 9.0, 15.0, 13.0, 3.0, 7.0, 2.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.06610107421875, -0.06407356262207031, -0.062046051025390625, -0.06001853942871094, -0.05799102783203125, -0.05596351623535156, -0.053936004638671875, -0.05190849304199219, -0.0498809814453125, -0.04785346984863281, -0.045825958251953125, -0.04379844665527344, -0.04177093505859375, -0.03974342346191406, -0.037715911865234375, -0.03568840026855469, -0.033660888671875, -0.03163337707519531, -0.029605865478515625, -0.027578353881835938, -0.02555084228515625, -0.023523330688476562, -0.021495819091796875, -0.019468307495117188, -0.0174407958984375, -0.015413284301757812, -0.013385772705078125, -0.011358261108398438, -0.00933074951171875, -0.0073032379150390625, -0.005275726318359375, -0.0032482147216796875, -0.001220703125, 0.0008068084716796875, 0.002834320068359375, 0.0048618316650390625, 0.00688934326171875, 0.008916854858398438, 0.010944366455078125, 0.012971878051757812, 0.0149993896484375, 0.017026901245117188, 0.019054412841796875, 0.021081924438476562, 0.02310943603515625, 0.025136947631835938, 0.027164459228515625, 0.029191970825195312, 0.031219482421875, 0.03324699401855469, 0.035274505615234375, 0.03730201721191406, 0.03932952880859375, 0.04135704040527344, 0.043384552001953125, 0.04541206359863281, 0.0474395751953125, 0.04946708679199219, 0.051494598388671875, 0.05352210998535156, 0.05554962158203125, 0.05757713317871094, 0.059604644775390625, 0.06163215637207031, 0.06365966796875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 7.0, 5.0, 6.0, 4.0, 12.0, 17.0, 9.0, 17.0, 21.0, 26.0, 31.0, 28.0, 46.0, 53.0, 74.0, 80.0, 96.0, 132.0, 164.0, 244.0, 326.0, 556.0, 1035.0, 2121.0, 5079.0, 13413.0, 40509.0, 142992.0, 513543.0, 234296.0, 60817.0, 19499.0, 6974.0, 2861.0, 1247.0, 655.0, 380.0, 271.0, 172.0, 150.0, 113.0, 91.0, 74.0, 58.0, 54.0, 43.0, 37.0, 36.0, 19.0, 15.0, 13.0, 9.0, 3.0, 12.0, 9.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.36376953125, -0.3522834777832031, -0.34079742431640625, -0.3293113708496094, -0.3178253173828125, -0.3063392639160156, -0.29485321044921875, -0.2833671569824219, -0.271881103515625, -0.2603950500488281, -0.24890899658203125, -0.23742294311523438, -0.2259368896484375, -0.21445083618164062, -0.20296478271484375, -0.19147872924804688, -0.17999267578125, -0.16850662231445312, -0.15702056884765625, -0.14553451538085938, -0.1340484619140625, -0.12256240844726562, -0.11107635498046875, -0.09959030151367188, -0.088104248046875, -0.07661819458007812, -0.06513214111328125, -0.053646087646484375, -0.0421600341796875, -0.030673980712890625, -0.01918792724609375, -0.007701873779296875, 0.0037841796875, 0.015270233154296875, 0.02675628662109375, 0.038242340087890625, 0.0497283935546875, 0.061214447021484375, 0.07270050048828125, 0.08418655395507812, 0.095672607421875, 0.10715866088867188, 0.11864471435546875, 0.13013076782226562, 0.1416168212890625, 0.15310287475585938, 0.16458892822265625, 0.17607498168945312, 0.18756103515625, 0.19904708862304688, 0.21053314208984375, 0.22201919555664062, 0.2335052490234375, 0.24499130249023438, 0.25647735595703125, 0.2679634094238281, 0.279449462890625, 0.2909355163574219, 0.30242156982421875, 0.3139076232910156, 0.3253936767578125, 0.3368797302246094, 0.34836578369140625, 0.3598518371582031, 0.371337890625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 13.0, 20.0, 14.0, 31.0, 72.0, 112.0, 174.0, 165.0, 141.0, 92.0, 62.0, 37.0, 14.0, 14.0, 10.0, 13.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07205367088317871, -0.06828658282756805, -0.0645194947719574, -0.06075240299105644, -0.056985314935445786, -0.05321822315454483, -0.049451135098934174, -0.04568404704332352, -0.04191695898771286, -0.0381498709321022, -0.03438277915120125, -0.03061569109559059, -0.026848603039979935, -0.02308151312172413, -0.019314423203468323, -0.015547335147857666, -0.01178024336695671, -0.00801315438002348, -0.004246064927428961, -0.00047897547483444214, 0.003288113512098789, 0.007055202499032021, 0.010822292417287827, 0.014589380472898483, 0.01835647039115429, 0.022123560309410095, 0.025890648365020752, 0.029657738283276558, 0.033424828201532364, 0.03719191625714302, 0.040959008038043976, 0.04472609609365463, 0.04849318414926529, 0.052260272204875946, 0.0560273639857769, 0.05979445204138756, 0.06356154382228851, 0.06732863187789917, 0.07109571993350983, 0.07486280798912048, 0.07862989604473114, 0.0823969841003418, 0.08616407215595245, 0.08993116021156311, 0.09369825571775436, 0.09746534377336502, 0.10123243182897568, 0.10499951988458633, 0.10876661539077759, 0.11253370344638824, 0.1163007915019989, 0.12006787955760956, 0.12383497506380081, 0.12760205566883087, 0.13136914372444153, 0.13513624668121338, 0.13890331983566284, 0.1426704078912735, 0.14643749594688416, 0.1502045840024948, 0.15397167205810547, 0.15773876011371613, 0.16150584816932678, 0.16527295112609863, 0.1690400391817093]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 7.0, 5.0, 3.0, 4.0, 5.0, 7.0, 12.0, 10.0, 11.0, 13.0, 14.0, 16.0, 19.0, 27.0, 23.0, 27.0, 29.0, 28.0, 43.0, 31.0, 41.0, 52.0, 29.0, 39.0, 45.0, 48.0, 33.0, 45.0, 36.0, 32.0, 34.0, 24.0, 23.0, 20.0, 24.0, 23.0, 25.0, 20.0, 15.0, 14.0, 10.0, 6.0, 7.0, 3.0, 5.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.03513616323471069, -0.03407980874180794, -0.03302345424890518, -0.03196709603071213, -0.030910741537809372, -0.029854387044906616, -0.02879803068935871, -0.027741674333810806, -0.02668531984090805, -0.025628965348005295, -0.02457260899245739, -0.023516252636909485, -0.02245989814400673, -0.021403543651103973, -0.02034718729555607, -0.019290830940008163, -0.018234476447105408, -0.017178121954202652, -0.016121765598654747, -0.015065410174429417, -0.014009054750204086, -0.012952699325978756, -0.011896343901753426, -0.010839988477528095, -0.009783633053302765, -0.008727277629077435, -0.007670922204852104, -0.006614566780626774, -0.0055582113564014435, -0.004501855932176113, -0.0034455005079507828, -0.0023891450837254524, -0.001332789659500122, -0.0002764342352747917, 0.0007799211889505386, 0.001836276613175869, 0.0028926320374011993, 0.00394898746162653, 0.00500534288585186, 0.00606169831007719, 0.007118053734302521, 0.008174409158527851, 0.009230764582753181, 0.010287120006978512, 0.011343475431203842, 0.012399830855429173, 0.013456186279654503, 0.014512541703879833, 0.015568897128105164, 0.01662525162100792, 0.017681607976555824, 0.01873796433210373, 0.019794318825006485, 0.02085067331790924, 0.021907029673457146, 0.02296338602900505, 0.024019740521907806, 0.025076095014810562, 0.026132451370358467, 0.027188807725906372, 0.028245162218809128, 0.029301516711711884, 0.03035787306725979, 0.031414229422807693, 0.03247058391571045]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 7.0, 10.0, 10.0, 15.0, 10.0, 19.0, 20.0, 16.0, 20.0, 31.0, 23.0, 24.0, 30.0, 26.0, 34.0, 35.0, 42.0, 42.0, 34.0, 49.0, 31.0, 36.0, 34.0, 38.0, 39.0, 34.0, 33.0, 20.0, 34.0, 25.0, 25.0, 13.0, 20.0, 23.0, 13.0, 11.0, 7.0, 13.0, 6.0, 10.0, 10.0, 5.0, 4.0, 4.0, 2.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-42.5625, -41.20361328125, -39.8447265625, -38.48583984375, -37.126953125, -35.76806640625, -34.4091796875, -33.05029296875, -31.69140625, -30.33251953125, -28.9736328125, -27.61474609375, -26.255859375, -24.89697265625, -23.5380859375, -22.17919921875, -20.8203125, -19.46142578125, -18.1025390625, -16.74365234375, -15.384765625, -14.02587890625, -12.6669921875, -11.30810546875, -9.94921875, -8.59033203125, -7.2314453125, -5.87255859375, -4.513671875, -3.15478515625, -1.7958984375, -0.43701171875, 0.921875, 2.28076171875, 3.6396484375, 4.99853515625, 6.357421875, 7.71630859375, 9.0751953125, 10.43408203125, 11.79296875, 13.15185546875, 14.5107421875, 15.86962890625, 17.228515625, 18.58740234375, 19.9462890625, 21.30517578125, 22.6640625, 24.02294921875, 25.3818359375, 26.74072265625, 28.099609375, 29.45849609375, 30.8173828125, 32.17626953125, 33.53515625, 34.89404296875, 36.2529296875, 37.61181640625, 38.970703125, 40.32958984375, 41.6884765625, 43.04736328125, 44.40625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 11.0, 14.0, 13.0, 15.0, 17.0, 36.0, 38.0, 59.0, 83.0, 101.0, 189.0, 305.0, 539.0, 892.0, 1645.0, 2976.0, 6207.0, 16346.0, 60693.0, 306090.0, 501120.0, 108559.0, 25467.0, 8656.0, 3762.0, 1906.0, 1052.0, 652.0, 382.0, 225.0, 145.0, 112.0, 54.0, 45.0, 39.0, 31.0, 16.0, 11.0, 13.0, 9.0, 11.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.5234375, -11.1539306640625, -10.784423828125, -10.4149169921875, -10.04541015625, -9.6759033203125, -9.306396484375, -8.9368896484375, -8.5673828125, -8.1978759765625, -7.828369140625, -7.4588623046875, -7.08935546875, -6.7198486328125, -6.350341796875, -5.9808349609375, -5.611328125, -5.2418212890625, -4.872314453125, -4.5028076171875, -4.13330078125, -3.7637939453125, -3.394287109375, -3.0247802734375, -2.6552734375, -2.2857666015625, -1.916259765625, -1.5467529296875, -1.17724609375, -0.8077392578125, -0.438232421875, -0.0687255859375, 0.30078125, 0.6702880859375, 1.039794921875, 1.4093017578125, 1.77880859375, 2.1483154296875, 2.517822265625, 2.8873291015625, 3.2568359375, 3.6263427734375, 3.995849609375, 4.3653564453125, 4.73486328125, 5.1043701171875, 5.473876953125, 5.8433837890625, 6.212890625, 6.5823974609375, 6.951904296875, 7.3214111328125, 7.69091796875, 8.0604248046875, 8.429931640625, 8.7994384765625, 9.1689453125, 9.5384521484375, 9.907958984375, 10.2774658203125, 10.64697265625, 11.0164794921875, 11.385986328125, 11.7554931640625, 12.125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 8.0, 17.0, 9.0, 25.0, 32.0, 37.0, 54.0, 67.0, 94.0, 81.0, 1971.0, 275.0, 78.0, 80.0, 59.0, 44.0, 39.0, 32.0, 14.0, 15.0, 9.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.875, -143.7626953125, -139.650390625, -135.5380859375, -131.42578125, -127.3134765625, -123.201171875, -119.0888671875, -114.9765625, -110.8642578125, -106.751953125, -102.6396484375, -98.52734375, -94.4150390625, -90.302734375, -86.1904296875, -82.078125, -77.9658203125, -73.853515625, -69.7412109375, -65.62890625, -61.5166015625, -57.404296875, -53.2919921875, -49.1796875, -45.0673828125, -40.955078125, -36.8427734375, -32.73046875, -28.6181640625, -24.505859375, -20.3935546875, -16.28125, -12.1689453125, -8.056640625, -3.9443359375, 0.16796875, 4.2802734375, 8.392578125, 12.5048828125, 16.6171875, 20.7294921875, 24.841796875, 28.9541015625, 33.06640625, 37.1787109375, 41.291015625, 45.4033203125, 49.515625, 53.6279296875, 57.740234375, 61.8525390625, 65.96484375, 70.0771484375, 74.189453125, 78.3017578125, 82.4140625, 86.5263671875, 90.638671875, 94.7509765625, 98.86328125, 102.9755859375, 107.087890625, 111.2001953125, 115.3125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 16.0, 12.0, 20.0, 24.0, 46.0, 78.0, 112.0, 254.0, 500.0, 1309.0, 4723.0, 149646.0, 2966920.0, 18150.0, 2321.0, 790.0, 343.0, 191.0, 93.0, 52.0, 36.0, 26.0, 14.0, 11.0, 5.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.40625, -30.4013671875, -29.396484375, -28.3916015625, -27.38671875, -26.3818359375, -25.376953125, -24.3720703125, -23.3671875, -22.3623046875, -21.357421875, -20.3525390625, -19.34765625, -18.3427734375, -17.337890625, -16.3330078125, -15.328125, -14.3232421875, -13.318359375, -12.3134765625, -11.30859375, -10.3037109375, -9.298828125, -8.2939453125, -7.2890625, -6.2841796875, -5.279296875, -4.2744140625, -3.26953125, -2.2646484375, -1.259765625, -0.2548828125, 0.75, 1.7548828125, 2.759765625, 3.7646484375, 4.76953125, 5.7744140625, 6.779296875, 7.7841796875, 8.7890625, 9.7939453125, 10.798828125, 11.8037109375, 12.80859375, 13.8134765625, 14.818359375, 15.8232421875, 16.828125, 17.8330078125, 18.837890625, 19.8427734375, 20.84765625, 21.8525390625, 22.857421875, 23.8623046875, 24.8671875, 25.8720703125, 26.876953125, 27.8818359375, 28.88671875, 29.8916015625, 30.896484375, 31.9013671875, 32.90625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 11.0, 24.0, 68.0, 167.0, 347.0, 225.0, 93.0, 26.0, 19.0, 8.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.62771606445312, -86.21513366699219, -78.80254364013672, -71.38995361328125, -63.97737121582031, -56.56478500366211, -49.152198791503906, -41.7396125793457, -34.3270263671875, -26.914440155029297, -19.501853942871094, -12.08926773071289, -4.6766815185546875, 2.7359046936035156, 10.148490905761719, 17.561077117919922, 24.973663330078125, 32.38624954223633, 39.79883575439453, 47.211421966552734, 54.62400817871094, 62.03659439086914, 69.44918060302734, 76.86177062988281, 84.27435302734375, 91.68693542480469, 99.09952545166016, 106.51211547851562, 113.92469787597656, 121.3372802734375, 128.7498779296875, 136.16246032714844, 143.57504272460938, 150.9876251220703, 158.40020751953125, 165.81280517578125, 173.2253875732422, 180.63796997070312, 188.05056762695312, 195.46315002441406, 202.875732421875, 210.28831481933594, 217.70089721679688, 225.11349487304688, 232.5260772705078, 239.93865966796875, 247.35125732421875, 254.7638397216797, 262.1764221191406, 269.5890197753906, 277.0015869140625, 284.4141845703125, 291.8267822265625, 299.2393493652344, 306.6519470214844, 314.06451416015625, 321.47711181640625, 328.88970947265625, 336.3022766113281, 343.7148742675781, 351.12744140625, 358.5400390625, 365.95263671875, 373.3652038574219, 380.7778015136719]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 12.0, 12.0, 19.0, 15.0, 25.0, 35.0, 29.0, 34.0, 48.0, 53.0, 53.0, 55.0, 51.0, 49.0, 43.0, 46.0, 61.0, 41.0, 42.0, 61.0, 34.0, 25.0, 19.0, 19.0, 22.0, 21.0, 8.0, 9.0, 12.0, 10.0, 3.0, 8.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-114.47296142578125, -111.21401977539062, -107.955078125, -104.69613647460938, -101.43719482421875, -98.17825317382812, -94.9193115234375, -91.66036987304688, -88.40142822265625, -85.14248657226562, -81.883544921875, -78.62460327148438, -75.36566162109375, -72.10671997070312, -68.8477783203125, -65.58883666992188, -62.32990264892578, -59.070960998535156, -55.81201934814453, -52.553077697753906, -49.29413604736328, -46.035194396972656, -42.7762565612793, -39.51731491088867, -36.25837326049805, -32.99943161010742, -29.740489959716797, -26.481550216674805, -23.22260856628418, -19.963666915893555, -16.704727172851562, -13.445785522460938, -10.186843872070312, -6.927902698516846, -3.668961524963379, -0.4100208282470703, 2.8489208221435547, 6.10786247253418, 9.366802215576172, 12.625743865966797, 15.884685516357422, 19.143627166748047, 22.402568817138672, 25.661508560180664, 28.92045021057129, 32.17938995361328, 35.438331604003906, 38.69727325439453, 41.956214904785156, 45.21515655517578, 48.474098205566406, 51.73303985595703, 54.991981506347656, 58.25092315673828, 61.50986099243164, 64.768798828125, 68.02774047851562, 71.28668212890625, 74.54562377929688, 77.8045654296875, 81.06350708007812, 84.32244873046875, 87.58139038085938, 90.84033203125, 94.09927368164062]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 8.0, 11.0, 15.0, 19.0, 28.0, 37.0, 65.0, 92.0, 131.0, 141.0, 191.0, 285.0, 343.0, 465.0, 624.0, 905.0, 1040176.0, 1711.0, 904.0, 612.0, 418.0, 344.0, 272.0, 213.0, 138.0, 121.0, 81.0, 50.0, 48.0, 22.0, 30.0, 18.0, 15.0, 10.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.43365478515625, -26.28952980041504, -25.145404815673828, -24.00128173828125, -22.85715675354004, -21.713031768798828, -20.568906784057617, -19.424781799316406, -18.280658721923828, -17.136533737182617, -15.992409706115723, -14.848284721374512, -13.704160690307617, -12.560035705566406, -11.415910720825195, -10.2717866897583, -9.127660751342773, -7.983536243438721, -6.839411735534668, -5.695286750793457, -4.551162242889404, -3.4070377349853516, -2.2629127502441406, -1.118788719177246, 0.025336265563964844, 1.1694608926773071, 2.3135855197906494, 3.4577102661132812, 4.601834774017334, 5.745959281921387, 6.890084266662598, 8.034208297729492, 9.178333282470703, 10.322458267211914, 11.466582298278809, 12.61070728302002, 13.754831314086914, 14.898956298828125, 16.043081283569336, 17.187206268310547, 18.331329345703125, 19.475454330444336, 20.619579315185547, 21.763702392578125, 22.907827377319336, 24.051952362060547, 25.196077346801758, 26.34020233154297, 27.48432731628418, 28.62845230102539, 29.7725772857666, 30.916702270507812, 32.06082534790039, 33.20494842529297, 34.34907531738281, 35.49319839477539, 36.637325286865234, 37.78144836425781, 38.925575256347656, 40.069698333740234, 41.21382522583008, 42.357948303222656, 43.5020751953125, 44.64619827270508, 45.790321350097656]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 7.0, 6.0, 6.0, 4.0, 6.0, 8.0, 10.0, 18.0, 31.0, 57.0, 153.0, 10681.0, 51451892.0, 170.0, 48.0, 18.0, 14.0, 6.0, 7.0, 3.0, 8.0, 5.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2576.9765625, -2478.245849609375, -2379.51513671875, -2280.784423828125, -2182.0537109375, -2083.322998046875, -1984.59228515625, -1885.861572265625, -1787.130859375, -1688.400146484375, -1589.66943359375, -1490.938720703125, -1392.2080078125, -1293.477294921875, -1194.74658203125, -1096.015869140625, -997.2850341796875, -898.5543212890625, -799.8236083984375, -701.0928955078125, -602.3621826171875, -503.6314392089844, -404.90069580078125, -306.16998291015625, -207.43927001953125, -108.70854949951172, -9.977828979492188, 88.75289916992188, 187.48361206054688, 286.2143249511719, 384.945068359375, 483.67578125, 582.406494140625, 681.13720703125, 779.867919921875, 878.5986328125, 977.329345703125, 1076.06005859375, 1174.790771484375, 1273.521484375, 1372.252197265625, 1470.98291015625, 1569.713623046875, 1668.4443359375, 1767.175048828125, 1865.90576171875, 1964.636474609375, 2063.3671875, 2162.09814453125, 2260.828857421875, 2359.5595703125, 2458.290283203125, 2557.02099609375, 2655.751708984375, 2754.482421875, 2853.213134765625, 2951.94384765625, 3050.674560546875, 3149.4052734375, 3248.135986328125, 3346.86669921875, 3445.597412109375, 3544.328125, 3643.058837890625, 3741.78955078125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 11.0, 7.0, 7.0, 22.0, 38.0, 42.0, 63.0, 92.0, 121.0, 151.0, 202.0, 296.0, 379.0, 493.0, 833.0, 1177.0, 1647.0, 2427.0, 3529.0, 5489.0, 8623.0, 13538.0, 22836.0, 38799.0, 68611.0, 129379.0, 244227.0, 442904.0, 2928465.0, 1457480.0, 414743.0, 226887.0, 119603.0, 64500.0, 35892.0, 21091.0, 12758.0, 8105.0, 5143.0, 3307.0, 2320.0, 1588.0, 1052.0, 706.0, 546.0, 346.0, 290.0, 201.0, 130.0, 88.0, 74.0, 60.0, 34.0, 28.0, 23.0, 19.0, 10.0, 8.0, 5.0], "bins": [-2.091796875, -2.0301666259765625, -1.968536376953125, -1.9069061279296875, -1.84527587890625, -1.7836456298828125, -1.722015380859375, -1.6603851318359375, -1.5987548828125, -1.5371246337890625, -1.475494384765625, -1.4138641357421875, -1.35223388671875, -1.2906036376953125, -1.228973388671875, -1.1673431396484375, -1.105712890625, -1.0440826416015625, -0.982452392578125, -0.9208221435546875, -0.85919189453125, -0.7975616455078125, -0.735931396484375, -0.6743011474609375, -0.6126708984375, -0.5510406494140625, -0.489410400390625, -0.4277801513671875, -0.36614990234375, -0.3045196533203125, -0.242889404296875, -0.1812591552734375, -0.11962890625, -0.0579986572265625, 0.003631591796875, 0.0652618408203125, 0.12689208984375, 0.1885223388671875, 0.250152587890625, 0.3117828369140625, 0.3734130859375, 0.4350433349609375, 0.496673583984375, 0.5583038330078125, 0.61993408203125, 0.6815643310546875, 0.743194580078125, 0.8048248291015625, 0.866455078125, 0.9280853271484375, 0.989715576171875, 1.0513458251953125, 1.11297607421875, 1.1746063232421875, 1.236236572265625, 1.2978668212890625, 1.3594970703125, 1.4211273193359375, 1.482757568359375, 1.5443878173828125, 1.60601806640625, 1.6676483154296875, 1.729278564453125, 1.7909088134765625, 1.8525390625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 9.0, 10.0, 6.0, 10.0, 15.0, 7.0, 17.0, 21.0, 14.0, 23.0, 36.0, 32.0, 34.0, 31.0, 33.0, 44.0, 37.0, 46.0, 129.0, 759.0, 244.0, 43.0, 33.0, 39.0, 45.0, 37.0, 32.0, 20.0, 25.0, 22.0, 26.0, 18.0, 20.0, 29.0, 11.0, 8.0, 13.0, 6.0, 4.0, 6.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.2890625, -8.966552734375, -8.64404296875, -8.321533203125, -7.9990234375, -7.676513671875, -7.35400390625, -7.031494140625, -6.708984375, -6.386474609375, -6.06396484375, -5.741455078125, -5.4189453125, -5.096435546875, -4.77392578125, -4.451416015625, -4.12890625, -3.806396484375, -3.48388671875, -3.161376953125, -2.8388671875, -2.516357421875, -2.19384765625, -1.871337890625, -1.548828125, -1.226318359375, -0.90380859375, -0.581298828125, -0.2587890625, 0.063720703125, 0.38623046875, 0.708740234375, 1.03125, 1.353759765625, 1.67626953125, 1.998779296875, 2.3212890625, 2.643798828125, 2.96630859375, 3.288818359375, 3.611328125, 3.933837890625, 4.25634765625, 4.578857421875, 4.9013671875, 5.223876953125, 5.54638671875, 5.868896484375, 6.19140625, 6.513916015625, 6.83642578125, 7.158935546875, 7.4814453125, 7.803955078125, 8.12646484375, 8.448974609375, 8.771484375, 9.093994140625, 9.41650390625, 9.739013671875, 10.0615234375, 10.384033203125, 10.70654296875, 11.029052734375, 11.3515625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 10.0, 32.0, 33.0, 42.0, 73.0, 108.0, 167.0, 223.0, 294.0, 451.0, 638.0, 1065.0, 1621.0, 2474.0, 3801.0, 5940.0, 9829.0, 15979.0, 27510.0, 47915.0, 84866.0, 156282.0, 298747.0, 587823.0, 3764142.0, 606279.0, 308329.0, 160117.0, 86595.0, 48067.0, 28051.0, 16457.0, 10107.0, 6183.0, 3929.0, 2487.0, 1591.0, 1032.0, 715.0, 454.0, 325.0, 218.0, 128.0, 96.0, 68.0, 30.0, 24.0, 18.0, 25.0, 15.0, 10.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0], "bins": [-2.296875, -2.22161865234375, -2.1463623046875, -2.07110595703125, -1.995849609375, -1.92059326171875, -1.8453369140625, -1.77008056640625, -1.69482421875, -1.61956787109375, -1.5443115234375, -1.46905517578125, -1.393798828125, -1.31854248046875, -1.2432861328125, -1.16802978515625, -1.0927734375, -1.01751708984375, -0.9422607421875, -0.86700439453125, -0.791748046875, -0.71649169921875, -0.6412353515625, -0.56597900390625, -0.49072265625, -0.41546630859375, -0.3402099609375, -0.26495361328125, -0.189697265625, -0.11444091796875, -0.0391845703125, 0.03607177734375, 0.111328125, 0.18658447265625, 0.2618408203125, 0.33709716796875, 0.412353515625, 0.48760986328125, 0.5628662109375, 0.63812255859375, 0.71337890625, 0.78863525390625, 0.8638916015625, 0.93914794921875, 1.014404296875, 1.08966064453125, 1.1649169921875, 1.24017333984375, 1.3154296875, 1.39068603515625, 1.4659423828125, 1.54119873046875, 1.616455078125, 1.69171142578125, 1.7669677734375, 1.84222412109375, 1.91748046875, 1.99273681640625, 2.0679931640625, 2.14324951171875, 2.218505859375, 2.29376220703125, 2.3690185546875, 2.44427490234375, 2.51953125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 4.0, 2.0, 14.0, 13.0, 22.0, 17.0, 19.0, 12.0, 20.0, 28.0, 20.0, 37.0, 29.0, 30.0, 36.0, 31.0, 39.0, 36.0, 101.0, 681.0, 338.0, 57.0, 41.0, 42.0, 40.0, 47.0, 39.0, 23.0, 23.0, 25.0, 19.0, 21.0, 26.0, 12.0, 13.0, 11.0, 12.0, 8.0, 6.0, 9.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.90625, -7.666259765625, -7.42626953125, -7.186279296875, -6.9462890625, -6.706298828125, -6.46630859375, -6.226318359375, -5.986328125, -5.746337890625, -5.50634765625, -5.266357421875, -5.0263671875, -4.786376953125, -4.54638671875, -4.306396484375, -4.06640625, -3.826416015625, -3.58642578125, -3.346435546875, -3.1064453125, -2.866455078125, -2.62646484375, -2.386474609375, -2.146484375, -1.906494140625, -1.66650390625, -1.426513671875, -1.1865234375, -0.946533203125, -0.70654296875, -0.466552734375, -0.2265625, 0.013427734375, 0.25341796875, 0.493408203125, 0.7333984375, 0.973388671875, 1.21337890625, 1.453369140625, 1.693359375, 1.933349609375, 2.17333984375, 2.413330078125, 2.6533203125, 2.893310546875, 3.13330078125, 3.373291015625, 3.61328125, 3.853271484375, 4.09326171875, 4.333251953125, 4.5732421875, 4.813232421875, 5.05322265625, 5.293212890625, 5.533203125, 5.773193359375, 6.01318359375, 6.253173828125, 6.4931640625, 6.733154296875, 6.97314453125, 7.213134765625, 7.453125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 1.0, 5.0, 7.0, 13.0, 24.0, 26.0, 32.0, 50.0, 71.0, 72.0, 105.0, 136.0, 192.0, 289.0, 312.0, 452.0, 706.0, 965.0, 1557.0, 2628.0, 4359.0, 8559.0, 19359.0, 62235.0, 5495867.0, 595629.0, 58679.0, 18992.0, 8323.0, 4279.0, 2475.0, 1561.0, 1012.0, 672.0, 460.0, 353.0, 259.0, 159.0, 140.0, 100.0, 84.0, 61.0, 42.0, 39.0, 27.0, 21.0, 12.0, 14.0, 12.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-10.609375, -10.2877197265625, -9.966064453125, -9.6444091796875, -9.32275390625, -9.0010986328125, -8.679443359375, -8.3577880859375, -8.0361328125, -7.7144775390625, -7.392822265625, -7.0711669921875, -6.74951171875, -6.4278564453125, -6.106201171875, -5.7845458984375, -5.462890625, -5.1412353515625, -4.819580078125, -4.4979248046875, -4.17626953125, -3.8546142578125, -3.532958984375, -3.2113037109375, -2.8896484375, -2.5679931640625, -2.246337890625, -1.9246826171875, -1.60302734375, -1.2813720703125, -0.959716796875, -0.6380615234375, -0.31640625, 0.0052490234375, 0.326904296875, 0.6485595703125, 0.97021484375, 1.2918701171875, 1.613525390625, 1.9351806640625, 2.2568359375, 2.5784912109375, 2.900146484375, 3.2218017578125, 3.54345703125, 3.8651123046875, 4.186767578125, 4.5084228515625, 4.830078125, 5.1517333984375, 5.473388671875, 5.7950439453125, 6.11669921875, 6.4383544921875, 6.760009765625, 7.0816650390625, 7.4033203125, 7.7249755859375, 8.046630859375, 8.3682861328125, 8.68994140625, 9.0115966796875, 9.333251953125, 9.6549072265625, 9.9765625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 5.0, 6.0, 4.0, 5.0, 9.0, 12.0, 10.0, 9.0, 23.0, 16.0, 20.0, 18.0, 21.0, 19.0, 25.0, 31.0, 44.0, 32.0, 32.0, 38.0, 51.0, 74.0, 141.0, 505.0, 394.0, 75.0, 40.0, 30.0, 32.0, 36.0, 26.0, 31.0, 19.0, 18.0, 20.0, 19.0, 12.0, 23.0, 9.0, 16.0, 15.0, 17.0, 10.0, 7.0, 2.0, 9.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.0703125, -4.90692138671875, -4.7435302734375, -4.58013916015625, -4.416748046875, -4.25335693359375, -4.0899658203125, -3.92657470703125, -3.76318359375, -3.59979248046875, -3.4364013671875, -3.27301025390625, -3.109619140625, -2.94622802734375, -2.7828369140625, -2.61944580078125, -2.4560546875, -2.29266357421875, -2.1292724609375, -1.96588134765625, -1.802490234375, -1.63909912109375, -1.4757080078125, -1.31231689453125, -1.14892578125, -0.98553466796875, -0.8221435546875, -0.65875244140625, -0.495361328125, -0.33197021484375, -0.1685791015625, -0.00518798828125, 0.158203125, 0.32159423828125, 0.4849853515625, 0.64837646484375, 0.811767578125, 0.97515869140625, 1.1385498046875, 1.30194091796875, 1.46533203125, 1.62872314453125, 1.7921142578125, 1.95550537109375, 2.118896484375, 2.28228759765625, 2.4456787109375, 2.60906982421875, 2.7724609375, 2.93585205078125, 3.0992431640625, 3.26263427734375, 3.426025390625, 3.58941650390625, 3.7528076171875, 3.91619873046875, 4.07958984375, 4.24298095703125, 4.4063720703125, 4.56976318359375, 4.733154296875, 4.89654541015625, 5.0599365234375, 5.22332763671875, 5.38671875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 10.0, 9.0, 37.0, 80.0, 176.0, 309.0, 233.0, 98.0, 23.0, 11.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.99706268310547, -43.09306335449219, -42.189064025878906, -41.285064697265625, -40.381065368652344, -39.47706604003906, -38.57306671142578, -37.669071197509766, -36.765071868896484, -35.8610725402832, -34.95707321166992, -34.05307388305664, -33.14907455444336, -32.245079040527344, -31.34107780456543, -30.43707847595215, -29.533079147338867, -28.629079818725586, -27.725080490112305, -26.821083068847656, -25.917083740234375, -25.013084411621094, -24.109085083007812, -23.20508575439453, -22.30108642578125, -21.39708709716797, -20.493087768554688, -19.589088439941406, -18.685091018676758, -17.781091690063477, -16.877092361450195, -15.973093032836914, -15.069096565246582, -14.1650972366333, -13.261098861694336, -12.357099533081055, -11.453100204467773, -10.549101829528809, -9.645102500915527, -8.741104125976562, -7.837104797363281, -6.933105945587158, -6.029107093811035, -5.125107765197754, -4.221108913421631, -3.317110061645508, -2.4131107330322266, -1.5091118812561035, -0.6051130294799805, 0.29888594150543213, 1.2028849124908447, 2.106884002685547, 3.01088285446167, 3.914881706237793, 4.818881034851074, 5.722879886627197, 6.62687873840332, 7.530877590179443, 8.434876441955566, 9.338875770568848, 10.242874145507812, 11.146873474121094, 12.050872802734375, 12.954872131347656, 13.858870506286621]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 17.0, 22.0, 24.0, 23.0, 38.0, 42.0, 39.0, 53.0, 70.0, 67.0, 61.0, 71.0, 77.0, 71.0, 73.0, 55.0, 48.0, 25.0, 28.0, 17.0, 14.0, 12.0, 14.0, 8.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.263928413391113, -14.757878303527832, -14.25182819366455, -13.74577808380127, -13.239728927612305, -12.733678817749023, -12.227628707885742, -11.721578598022461, -11.21552848815918, -10.709478378295898, -10.203428268432617, -9.697378158569336, -9.191328048706055, -8.685277938842773, -8.179228782653809, -7.673178672790527, -7.167128562927246, -6.661078453063965, -6.155028343200684, -5.6489787101745605, -5.142928600311279, -4.636878490447998, -4.130828857421875, -3.6247787475585938, -3.1187286376953125, -2.6126785278320312, -2.106628656387329, -1.6005786657333374, -1.0945286750793457, -0.5884785652160645, -0.0824286937713623, 0.42362117767333984, 0.9296722412109375, 1.4357222318649292, 1.941772222518921, 2.447822093963623, 2.9538722038269043, 3.4599223136901855, 3.9659721851348877, 4.47202205657959, 4.978072166442871, 5.484122276306152, 5.990172386169434, 6.496222019195557, 7.002272129058838, 7.508322238922119, 8.014371871948242, 8.520421981811523, 9.026472091674805, 9.532522201538086, 10.038572311401367, 10.544622421264648, 11.05067253112793, 11.556722640991211, 12.062771797180176, 12.568821907043457, 13.074872016906738, 13.58092212677002, 14.0869722366333, 14.593022346496582, 15.099071502685547, 15.605121612548828, 16.11117172241211, 16.61722183227539, 17.123271942138672]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 8.0, 8.0, 14.0, 10.0, 22.0, 34.0, 43.0, 51.0, 76.0, 112.0, 158.0, 208.0, 315.0, 482.0, 732.0, 1237.0, 1983.0, 3272.0, 6075.0, 12140.0, 29409.0, 105581.0, 3804638.0, 153821.0, 38835.0, 16019.0, 7727.0, 4329.0, 2527.0, 1543.0, 939.0, 611.0, 402.0, 282.0, 177.0, 130.0, 89.0, 69.0, 33.0, 42.0, 18.0, 22.0, 10.0, 16.0, 7.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.2049560546875, -0.19803237915039062, -0.19110870361328125, -0.18418502807617188, -0.1772613525390625, -0.17033767700195312, -0.16341400146484375, -0.15649032592773438, -0.149566650390625, -0.14264297485351562, -0.13571929931640625, -0.12879562377929688, -0.1218719482421875, -0.11494827270507812, -0.10802459716796875, -0.10110092163085938, -0.09417724609375, -0.08725357055664062, -0.08032989501953125, -0.07340621948242188, -0.0664825439453125, -0.059558868408203125, -0.05263519287109375, -0.045711517333984375, -0.038787841796875, -0.031864166259765625, -0.02494049072265625, -0.018016815185546875, -0.0110931396484375, -0.004169464111328125, 0.00275421142578125, 0.009677886962890625, 0.0166015625, 0.023525238037109375, 0.03044891357421875, 0.037372589111328125, 0.0442962646484375, 0.051219940185546875, 0.05814361572265625, 0.06506729125976562, 0.071990966796875, 0.07891464233398438, 0.08583831787109375, 0.09276199340820312, 0.0996856689453125, 0.10660934448242188, 0.11353302001953125, 0.12045669555664062, 0.12738037109375, 0.13430404663085938, 0.14122772216796875, 0.14815139770507812, 0.1550750732421875, 0.16199874877929688, 0.16892242431640625, 0.17584609985351562, 0.182769775390625, 0.18969345092773438, 0.19661712646484375, 0.20354080200195312, 0.2104644775390625, 0.21738815307617188, 0.22431182861328125, 0.23123550415039062, 0.2381591796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 1.0, 3.0, 8.0, 5.0, 10.0, 15.0, 19.0, 20.0, 44.0, 751.0, 19.0, 20.0, 17.0, 6.0, 8.0, 3.0, 7.0, 3.0, 5.0, 3.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06097412109375, -0.05882549285888672, -0.05667686462402344, -0.054528236389160156, -0.052379608154296875, -0.050230979919433594, -0.04808235168457031, -0.04593372344970703, -0.04378509521484375, -0.04163646697998047, -0.03948783874511719, -0.037339210510253906, -0.035190582275390625, -0.033041954040527344, -0.030893325805664062, -0.02874469757080078, -0.0265960693359375, -0.02444744110107422, -0.022298812866210938, -0.020150184631347656, -0.018001556396484375, -0.015852928161621094, -0.013704299926757812, -0.011555671691894531, -0.00940704345703125, -0.007258415222167969, -0.0051097869873046875, -0.0029611587524414062, -0.000812530517578125, 0.0013360977172851562, 0.0034847259521484375, 0.005633354187011719, 0.007781982421875, 0.009930610656738281, 0.012079238891601562, 0.014227867126464844, 0.016376495361328125, 0.018525123596191406, 0.020673751831054688, 0.02282238006591797, 0.02497100830078125, 0.02711963653564453, 0.029268264770507812, 0.031416893005371094, 0.033565521240234375, 0.035714149475097656, 0.03786277770996094, 0.04001140594482422, 0.0421600341796875, 0.04430866241455078, 0.04645729064941406, 0.048605918884277344, 0.050754547119140625, 0.052903175354003906, 0.05505180358886719, 0.05720043182373047, 0.05934906005859375, 0.06149768829345703, 0.06364631652832031, 0.0657949447631836, 0.06794357299804688, 0.07009220123291016, 0.07224082946777344, 0.07438945770263672, 0.0765380859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 3.0, 11.0, 10.0, 12.0, 28.0, 31.0, 52.0, 76.0, 145.0, 272.0, 430.0, 894.0, 1901.0, 4254.0, 10652.0, 30840.0, 106418.0, 517918.0, 2725018.0, 622595.0, 119964.0, 33609.0, 11176.0, 4300.0, 1873.0, 865.0, 380.0, 232.0, 118.0, 66.0, 49.0, 30.0, 18.0, 21.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.223876953125, -0.21757888793945312, -0.21128082275390625, -0.20498275756835938, -0.1986846923828125, -0.19238662719726562, -0.18608856201171875, -0.17979049682617188, -0.173492431640625, -0.16719436645507812, -0.16089630126953125, -0.15459823608398438, -0.1483001708984375, -0.14200210571289062, -0.13570404052734375, -0.12940597534179688, -0.12310791015625, -0.11680984497070312, -0.11051177978515625, -0.10421371459960938, -0.0979156494140625, -0.09161758422851562, -0.08531951904296875, -0.07902145385742188, -0.072723388671875, -0.06642532348632812, -0.06012725830078125, -0.053829193115234375, -0.0475311279296875, -0.041233062744140625, -0.03493499755859375, -0.028636932373046875, -0.0223388671875, -0.016040802001953125, -0.00974273681640625, -0.003444671630859375, 0.0028533935546875, 0.009151458740234375, 0.01544952392578125, 0.021747589111328125, 0.028045654296875, 0.034343719482421875, 0.04064178466796875, 0.046939849853515625, 0.0532379150390625, 0.059535980224609375, 0.06583404541015625, 0.07213211059570312, 0.07843017578125, 0.08472824096679688, 0.09102630615234375, 0.09732437133789062, 0.1036224365234375, 0.10992050170898438, 0.11621856689453125, 0.12251663208007812, 0.128814697265625, 0.13511276245117188, 0.14141082763671875, 0.14770889282226562, 0.1540069580078125, 0.16030502319335938, 0.16660308837890625, 0.17290115356445312, 0.17919921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 4.0, 7.0, 7.0, 7.0, 9.0, 18.0, 30.0, 28.0, 42.0, 44.0, 89.0, 85.0, 127.0, 205.0, 287.0, 476.0, 777.0, 656.0, 367.0, 235.0, 172.0, 97.0, 69.0, 45.0, 55.0, 32.0, 23.0, 22.0, 16.0, 11.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0823974609375, -0.08009052276611328, -0.07778358459472656, -0.07547664642333984, -0.07316970825195312, -0.0708627700805664, -0.06855583190917969, -0.06624889373779297, -0.06394195556640625, -0.06163501739501953, -0.05932807922363281, -0.057021141052246094, -0.054714202880859375, -0.052407264709472656, -0.05010032653808594, -0.04779338836669922, -0.0454864501953125, -0.04317951202392578, -0.04087257385253906, -0.038565635681152344, -0.036258697509765625, -0.033951759338378906, -0.03164482116699219, -0.02933788299560547, -0.02703094482421875, -0.02472400665283203, -0.022417068481445312, -0.020110130310058594, -0.017803192138671875, -0.015496253967285156, -0.013189315795898438, -0.010882377624511719, -0.008575439453125, -0.006268501281738281, -0.0039615631103515625, -0.0016546249389648438, 0.000652313232421875, 0.0029592514038085938, 0.0052661895751953125, 0.007573127746582031, 0.00988006591796875, 0.012187004089355469, 0.014493942260742188, 0.016800880432128906, 0.019107818603515625, 0.021414756774902344, 0.023721694946289062, 0.02602863311767578, 0.0283355712890625, 0.03064250946044922, 0.03294944763183594, 0.035256385803222656, 0.037563323974609375, 0.039870262145996094, 0.04217720031738281, 0.04448413848876953, 0.04679107666015625, 0.04909801483154297, 0.05140495300292969, 0.053711891174316406, 0.056018829345703125, 0.058325767517089844, 0.06063270568847656, 0.06293964385986328, 0.06524658203125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 14.0, 28.0, 37.0, 79.0, 143.0, 207.0, 226.0, 145.0, 58.0, 39.0, 15.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7778091430664062, -0.7519026398658752, -0.7259961366653442, -0.700089693069458, -0.674183189868927, -0.648276686668396, -0.622370183467865, -0.596463680267334, -0.5705572366714478, -0.5446507334709167, -0.5187442302703857, -0.4928377568721771, -0.4669312834739685, -0.4410247802734375, -0.4151182770729065, -0.3892117738723755, -0.3633052706718445, -0.3373987674713135, -0.31149229407310486, -0.28558579087257385, -0.25967931747436523, -0.23377281427383423, -0.20786631107330322, -0.1819598227739334, -0.1560533344745636, -0.1301468461751938, -0.10424035042524338, -0.07833385467529297, -0.05242736637592316, -0.026520878076553345, -0.0006143748760223389, 0.025292113423347473, 0.05119854211807251, 0.07710503041744232, 0.10301152616739273, 0.12891802191734314, 0.15482451021671295, 0.18073099851608276, 0.20663750171661377, 0.23254399001598358, 0.2584504783153534, 0.2843569815158844, 0.310263454914093, 0.336169958114624, 0.36207646131515503, 0.38798293471336365, 0.41388943791389465, 0.43979591131210327, 0.4657024145126343, 0.4916089177131653, 0.5175154209136963, 0.5434218645095825, 0.5693283677101135, 0.5952348709106445, 0.6211413741111755, 0.6470478773117065, 0.6729543209075928, 0.6988608241081238, 0.7247673273086548, 0.750673770904541, 0.776580274105072, 0.802486777305603, 0.828393280506134, 0.854299783706665, 0.880206286907196]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 9.0, 8.0, 19.0, 20.0, 22.0, 30.0, 36.0, 35.0, 47.0, 54.0, 61.0, 59.0, 67.0, 78.0, 70.0, 60.0, 61.0, 56.0, 56.0, 26.0, 30.0, 20.0, 21.0, 13.0, 12.0, 8.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38632452487945557, -0.37400761246681213, -0.3616907000541687, -0.34937378764152527, -0.33705687522888184, -0.3247399628162384, -0.31242305040359497, -0.30010613799095154, -0.2877892255783081, -0.2754723131656647, -0.26315540075302124, -0.2508384883403778, -0.23852157592773438, -0.22620466351509094, -0.2138877511024475, -0.20157083868980408, -0.18925391137599945, -0.17693699896335602, -0.16462008655071259, -0.15230317413806915, -0.13998626172542572, -0.1276693493127823, -0.11535242944955826, -0.10303551703691483, -0.09071860462427139, -0.07840169221162796, -0.06608477979898453, -0.053767863661050797, -0.041450951248407364, -0.02913403883576393, -0.0168171226978302, -0.004500210285186768, 0.007816702127456665, 0.020133614540100098, 0.03245052695274353, 0.04476744309067726, 0.057084355503320694, 0.06940126419067383, 0.08171818405389786, 0.09403509646654129, 0.10635200887918472, 0.11866892129182816, 0.13098584115505219, 0.14330275356769562, 0.15561966598033905, 0.16793657839298248, 0.18025349080562592, 0.19257040321826935, 0.20488731563091278, 0.2172042280435562, 0.22952114045619965, 0.24183805286884308, 0.2541549801826477, 0.26647189259529114, 0.27878880500793457, 0.291105717420578, 0.30342262983322144, 0.31573954224586487, 0.3280564546585083, 0.34037336707115173, 0.35269027948379517, 0.3650071918964386, 0.37732410430908203, 0.38964101672172546, 0.4019579291343689]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 8.0, 13.0, 5.0, 17.0, 17.0, 34.0, 44.0, 63.0, 79.0, 128.0, 180.0, 261.0, 422.0, 617.0, 890.0, 1479.0, 2346.0, 3811.0, 6338.0, 12112.0, 25601.0, 226965.0, 699391.0, 33924.0, 14625.0, 7580.0, 4351.0, 2621.0, 1639.0, 967.0, 688.0, 408.0, 286.0, 192.0, 125.0, 97.0, 66.0, 45.0, 36.0, 19.0, 25.0, 13.0, 8.0, 3.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.31787109375, -0.3079795837402344, -0.29808807373046875, -0.2881965637207031, -0.2783050537109375, -0.2684135437011719, -0.25852203369140625, -0.24863052368164062, -0.238739013671875, -0.22884750366210938, -0.21895599365234375, -0.20906448364257812, -0.1991729736328125, -0.18928146362304688, -0.17938995361328125, -0.16949844360351562, -0.15960693359375, -0.14971542358398438, -0.13982391357421875, -0.12993240356445312, -0.1200408935546875, -0.11014938354492188, -0.10025787353515625, -0.09036636352539062, -0.080474853515625, -0.07058334350585938, -0.06069183349609375, -0.050800323486328125, -0.0409088134765625, -0.031017303466796875, -0.02112579345703125, -0.011234283447265625, -0.0013427734375, 0.008548736572265625, 0.01844024658203125, 0.028331756591796875, 0.0382232666015625, 0.048114776611328125, 0.05800628662109375, 0.06789779663085938, 0.077789306640625, 0.08768081665039062, 0.09757232666015625, 0.10746383666992188, 0.1173553466796875, 0.12724685668945312, 0.13713836669921875, 0.14702987670898438, 0.15692138671875, 0.16681289672851562, 0.17670440673828125, 0.18659591674804688, 0.1964874267578125, 0.20637893676757812, 0.21627044677734375, 0.22616195678710938, 0.236053466796875, 0.24594497680664062, 0.25583648681640625, 0.2657279968261719, 0.2756195068359375, 0.2855110168457031, 0.29540252685546875, 0.3052940368652344, 0.315185546875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 12.0, 13.0, 19.0, 26.0, 181.0, 426.0, 184.0, 31.0, 15.0, 8.0, 8.0, 9.0, 2.0, 3.0, 7.0, 4.0, 5.0, 2.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0614013671875, -0.05939292907714844, -0.057384490966796875, -0.05537605285644531, -0.05336761474609375, -0.05135917663574219, -0.049350738525390625, -0.04734230041503906, -0.0453338623046875, -0.04332542419433594, -0.041316986083984375, -0.03930854797363281, -0.03730010986328125, -0.03529167175292969, -0.033283233642578125, -0.03127479553222656, -0.029266357421875, -0.027257919311523438, -0.025249481201171875, -0.023241043090820312, -0.02123260498046875, -0.019224166870117188, -0.017215728759765625, -0.015207290649414062, -0.0131988525390625, -0.011190414428710938, -0.009181976318359375, -0.0071735382080078125, -0.00516510009765625, -0.0031566619873046875, -0.001148223876953125, 0.0008602142333984375, 0.00286865234375, 0.0048770904541015625, 0.006885528564453125, 0.008893966674804688, 0.01090240478515625, 0.012910842895507812, 0.014919281005859375, 0.016927719116210938, 0.0189361572265625, 0.020944595336914062, 0.022953033447265625, 0.024961471557617188, 0.02696990966796875, 0.028978347778320312, 0.030986785888671875, 0.03299522399902344, 0.035003662109375, 0.03701210021972656, 0.039020538330078125, 0.04102897644042969, 0.04303741455078125, 0.04504585266113281, 0.047054290771484375, 0.04906272888183594, 0.0510711669921875, 0.05307960510253906, 0.055088043212890625, 0.05709648132324219, 0.05910491943359375, 0.06111335754394531, 0.06312179565429688, 0.06513023376464844, 0.067138671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 11.0, 13.0, 11.0, 19.0, 26.0, 36.0, 51.0, 86.0, 141.0, 211.0, 306.0, 557.0, 1038.0, 2093.0, 5188.0, 14830.0, 52014.0, 218862.0, 507783.0, 180027.0, 43579.0, 12728.0, 4606.0, 1982.0, 945.0, 527.0, 304.0, 165.0, 131.0, 97.0, 41.0, 45.0, 24.0, 21.0, 12.0, 5.0, 5.0, 9.0, 6.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.3056640625, -0.2967872619628906, -0.28791046142578125, -0.2790336608886719, -0.2701568603515625, -0.2612800598144531, -0.25240325927734375, -0.24352645874023438, -0.234649658203125, -0.22577285766601562, -0.21689605712890625, -0.20801925659179688, -0.1991424560546875, -0.19026565551757812, -0.18138885498046875, -0.17251205444335938, -0.16363525390625, -0.15475845336914062, -0.14588165283203125, -0.13700485229492188, -0.1281280517578125, -0.11925125122070312, -0.11037445068359375, -0.10149765014648438, -0.092620849609375, -0.08374404907226562, -0.07486724853515625, -0.06599044799804688, -0.0571136474609375, -0.048236846923828125, -0.03936004638671875, -0.030483245849609375, -0.0216064453125, -0.012729644775390625, -0.00385284423828125, 0.005023956298828125, 0.0139007568359375, 0.022777557373046875, 0.03165435791015625, 0.040531158447265625, 0.049407958984375, 0.058284759521484375, 0.06716156005859375, 0.07603836059570312, 0.0849151611328125, 0.09379196166992188, 0.10266876220703125, 0.11154556274414062, 0.12042236328125, 0.12929916381835938, 0.13817596435546875, 0.14705276489257812, 0.1559295654296875, 0.16480636596679688, 0.17368316650390625, 0.18255996704101562, 0.191436767578125, 0.20031356811523438, 0.20919036865234375, 0.21806716918945312, 0.2269439697265625, 0.23582077026367188, 0.24469757080078125, 0.2535743713378906, 0.262451171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 12.0, 11.0, 11.0, 14.0, 21.0, 25.0, 21.0, 28.0, 29.0, 31.0, 34.0, 41.0, 51.0, 46.0, 41.0, 48.0, 46.0, 52.0, 50.0, 45.0, 47.0, 27.0, 42.0, 34.0, 37.0, 34.0, 19.0, 23.0, 13.0, 15.0, 13.0, 8.0, 2.0, 9.0, 7.0, 6.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.253173828125, -0.24493789672851562, -0.23670196533203125, -0.22846603393554688, -0.2202301025390625, -0.21199417114257812, -0.20375823974609375, -0.19552230834960938, -0.187286376953125, -0.17905044555664062, -0.17081451416015625, -0.16257858276367188, -0.1543426513671875, -0.14610671997070312, -0.13787078857421875, -0.12963485717773438, -0.12139892578125, -0.11316299438476562, -0.10492706298828125, -0.09669113159179688, -0.0884552001953125, -0.08021926879882812, -0.07198333740234375, -0.06374740600585938, -0.055511474609375, -0.047275543212890625, -0.03903961181640625, -0.030803680419921875, -0.0225677490234375, -0.014331817626953125, -0.00609588623046875, 0.002140045166015625, 0.0103759765625, 0.018611907958984375, 0.02684783935546875, 0.035083770751953125, 0.0433197021484375, 0.051555633544921875, 0.05979156494140625, 0.06802749633789062, 0.076263427734375, 0.08449935913085938, 0.09273529052734375, 0.10097122192382812, 0.1092071533203125, 0.11744308471679688, 0.12567901611328125, 0.13391494750976562, 0.14215087890625, 0.15038681030273438, 0.15862274169921875, 0.16685867309570312, 0.1750946044921875, 0.18333053588867188, 0.19156646728515625, 0.19980239868164062, 0.208038330078125, 0.21627426147460938, 0.22451019287109375, 0.23274612426757812, 0.2409820556640625, 0.24921798706054688, 0.25745391845703125, 0.2656898498535156, 0.27392578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 4.0, 5.0, 11.0, 10.0, 18.0, 24.0, 52.0, 62.0, 98.0, 176.0, 272.0, 529.0, 1157.0, 2838.0, 8840.0, 60830.0, 877939.0, 80101.0, 9944.0, 3124.0, 1210.0, 544.0, 290.0, 151.0, 83.0, 72.0, 50.0, 44.0, 25.0, 18.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.505828857421875, -0.48870849609375, -0.471588134765625, -0.4544677734375, -0.437347412109375, -0.42022705078125, -0.403106689453125, -0.385986328125, -0.368865966796875, -0.35174560546875, -0.334625244140625, -0.3175048828125, -0.300384521484375, -0.28326416015625, -0.266143798828125, -0.2490234375, -0.231903076171875, -0.21478271484375, -0.197662353515625, -0.1805419921875, -0.163421630859375, -0.14630126953125, -0.129180908203125, -0.112060546875, -0.094940185546875, -0.07781982421875, -0.060699462890625, -0.0435791015625, -0.026458740234375, -0.00933837890625, 0.007781982421875, 0.02490234375, 0.042022705078125, 0.05914306640625, 0.076263427734375, 0.0933837890625, 0.110504150390625, 0.12762451171875, 0.144744873046875, 0.161865234375, 0.178985595703125, 0.19610595703125, 0.213226318359375, 0.2303466796875, 0.247467041015625, 0.26458740234375, 0.281707763671875, 0.298828125, 0.315948486328125, 0.33306884765625, 0.350189208984375, 0.3673095703125, 0.384429931640625, 0.40155029296875, 0.418670654296875, 0.435791015625, 0.452911376953125, 0.47003173828125, 0.487152099609375, 0.5042724609375, 0.521392822265625, 0.53851318359375, 0.555633544921875, 0.57275390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 8.0, 4.0, 1.0, 8.0, 6.0, 11.0, 15.0, 18.0, 28.0, 35.0, 51.0, 46.0, 70.0, 59.0, 73.0, 58.0, 100.0, 75.0, 59.0, 51.0, 43.0, 33.0, 39.0, 24.0, 21.0, 7.0, 15.0, 9.0, 5.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.722574234008789e-05, -1.6555190086364746e-05, -1.58846378326416e-05, -1.5214085578918457e-05, -1.4543533325195312e-05, -1.3872981071472168e-05, -1.3202428817749023e-05, -1.2531876564025879e-05, -1.1861324310302734e-05, -1.119077205657959e-05, -1.0520219802856445e-05, -9.8496675491333e-06, -9.179115295410156e-06, -8.508563041687012e-06, -7.838010787963867e-06, -7.167458534240723e-06, -6.496906280517578e-06, -5.826354026794434e-06, -5.155801773071289e-06, -4.4852495193481445e-06, -3.814697265625e-06, -3.1441450119018555e-06, -2.473592758178711e-06, -1.8030405044555664e-06, -1.1324882507324219e-06, -4.6193599700927734e-07, 2.086162567138672e-07, 8.791685104370117e-07, 1.5497207641601562e-06, 2.2202730178833008e-06, 2.8908252716064453e-06, 3.56137752532959e-06, 4.231929779052734e-06, 4.902482032775879e-06, 5.5730342864990234e-06, 6.243586540222168e-06, 6.9141387939453125e-06, 7.584691047668457e-06, 8.255243301391602e-06, 8.925795555114746e-06, 9.59634780883789e-06, 1.0266900062561035e-05, 1.093745231628418e-05, 1.1608004570007324e-05, 1.2278556823730469e-05, 1.2949109077453613e-05, 1.3619661331176758e-05, 1.4290213584899902e-05, 1.4960765838623047e-05, 1.563131809234619e-05, 1.6301870346069336e-05, 1.697242259979248e-05, 1.7642974853515625e-05, 1.831352710723877e-05, 1.8984079360961914e-05, 1.965463161468506e-05, 2.0325183868408203e-05, 2.0995736122131348e-05, 2.1666288375854492e-05, 2.2336840629577637e-05, 2.300739288330078e-05, 2.3677945137023926e-05, 2.434849739074707e-05, 2.5019049644470215e-05, 2.568960189819336e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 7.0, 5.0, 17.0, 23.0, 25.0, 51.0, 62.0, 91.0, 113.0, 201.0, 291.0, 410.0, 741.0, 1351.0, 2493.0, 4686.0, 10600.0, 26936.0, 82704.0, 312472.0, 426013.0, 116963.0, 35916.0, 13589.0, 6000.0, 2900.0, 1555.0, 845.0, 516.0, 305.0, 207.0, 128.0, 97.0, 73.0, 47.0, 30.0, 22.0, 16.0, 13.0, 5.0, 5.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.23828125, -0.23109054565429688, -0.22389984130859375, -0.21670913696289062, -0.2095184326171875, -0.20232772827148438, -0.19513702392578125, -0.18794631958007812, -0.180755615234375, -0.17356491088867188, -0.16637420654296875, -0.15918350219726562, -0.1519927978515625, -0.14480209350585938, -0.13761138916015625, -0.13042068481445312, -0.12322998046875, -0.11603927612304688, -0.10884857177734375, -0.10165786743164062, -0.0944671630859375, -0.08727645874023438, -0.08008575439453125, -0.07289505004882812, -0.065704345703125, -0.058513641357421875, -0.05132293701171875, -0.044132232666015625, -0.0369415283203125, -0.029750823974609375, -0.02256011962890625, -0.015369415283203125, -0.0081787109375, -0.000988006591796875, 0.00620269775390625, 0.013393402099609375, 0.0205841064453125, 0.027774810791015625, 0.03496551513671875, 0.042156219482421875, 0.049346923828125, 0.056537628173828125, 0.06372833251953125, 0.07091903686523438, 0.0781097412109375, 0.08530044555664062, 0.09249114990234375, 0.09968185424804688, 0.10687255859375, 0.11406326293945312, 0.12125396728515625, 0.12844467163085938, 0.1356353759765625, 0.14282608032226562, 0.15001678466796875, 0.15720748901367188, 0.164398193359375, 0.17158889770507812, 0.17877960205078125, 0.18597030639648438, 0.1931610107421875, 0.20035171508789062, 0.20754241943359375, 0.21473312377929688, 0.221923828125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 5.0, 3.0, 8.0, 12.0, 16.0, 15.0, 26.0, 35.0, 28.0, 38.0, 49.0, 44.0, 62.0, 77.0, 71.0, 69.0, 56.0, 50.0, 58.0, 47.0, 48.0, 30.0, 27.0, 20.0, 35.0, 12.0, 10.0, 7.0, 9.0, 4.0, 6.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.204833984375, -0.19755172729492188, -0.19026947021484375, -0.18298721313476562, -0.1757049560546875, -0.16842269897460938, -0.16114044189453125, -0.15385818481445312, -0.146575927734375, -0.13929367065429688, -0.13201141357421875, -0.12472915649414062, -0.1174468994140625, -0.11016464233398438, -0.10288238525390625, -0.09560012817382812, -0.08831787109375, -0.08103561401367188, -0.07375335693359375, -0.06647109985351562, -0.0591888427734375, -0.051906585693359375, -0.04462432861328125, -0.037342071533203125, -0.030059814453125, -0.022777557373046875, -0.01549530029296875, -0.008213043212890625, -0.0009307861328125, 0.006351470947265625, 0.01363372802734375, 0.020915985107421875, 0.0281982421875, 0.035480499267578125, 0.04276275634765625, 0.050045013427734375, 0.0573272705078125, 0.06460952758789062, 0.07189178466796875, 0.07917404174804688, 0.086456298828125, 0.09373855590820312, 0.10102081298828125, 0.10830307006835938, 0.1155853271484375, 0.12286758422851562, 0.13014984130859375, 0.13743209838867188, 0.14471435546875, 0.15199661254882812, 0.15927886962890625, 0.16656112670898438, 0.1738433837890625, 0.18112564086914062, 0.18840789794921875, 0.19569015502929688, 0.202972412109375, 0.21025466918945312, 0.21753692626953125, 0.22481918334960938, 0.2321014404296875, 0.23938369750976562, 0.24666595458984375, 0.2539482116699219, 0.26123046875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 18.0, 25.0, 83.0, 195.0, 336.0, 200.0, 74.0, 25.0, 13.0, 6.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.972434043884277, -4.819847106933594, -4.667260646820068, -4.514673709869385, -4.362086772918701, -4.209499835968018, -4.056913375854492, -3.9043264389038086, -3.751739501953125, -3.5991528034210205, -3.446565866470337, -3.2939791679382324, -3.141392230987549, -2.9888055324554443, -2.83621883392334, -2.6836318969726562, -2.5310451984405518, -2.3784584999084473, -2.2258715629577637, -2.073284864425659, -1.9206979274749756, -1.768111228942871, -1.615524411201477, -1.462937593460083, -1.310350775718689, -1.157763957977295, -1.0051771402359009, -0.8525903820991516, -0.7000035643577576, -0.5474167466163635, -0.39482998847961426, -0.24224317073822021, -0.08965635299682617, 0.06293044984340668, 0.21551725268363953, 0.3681040406227112, 0.5206908583641052, 0.6732776761054993, 0.8258644342422485, 0.9784512519836426, 1.1310380697250366, 1.2836248874664307, 1.4362117052078247, 1.5887985229492188, 1.7413852214813232, 1.8939721584320068, 2.0465588569641113, 2.199145793914795, 2.3517324924468994, 2.504319190979004, 2.6569061279296875, 2.809492826461792, 2.9620797634124756, 3.11466646194458, 3.2672533988952637, 3.419840097427368, 3.5724267959594727, 3.725013494491577, 3.8776004314422607, 4.030187129974365, 4.182774066925049, 4.335361003875732, 4.487947463989258, 4.640534400939941, 4.793121337890625]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 5.0, 7.0, 8.0, 17.0, 23.0, 32.0, 60.0, 93.0, 153.0, 168.0, 145.0, 96.0, 52.0, 43.0, 24.0, 12.0, 10.0, 5.0, 9.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.309418201446533, -5.1514363288879395, -4.993454933166504, -4.83547306060791, -4.677491188049316, -4.519509315490723, -4.361527442932129, -4.203546047210693, -4.0455641746521, -3.887582302093506, -3.729600667953491, -3.5716190338134766, -3.413637161254883, -3.255655288696289, -3.0976736545562744, -2.9396920204162598, -2.781710147857666, -2.6237282752990723, -2.4657466411590576, -2.307765007019043, -2.149783134460449, -1.991801381111145, -1.8338196277618408, -1.6758378744125366, -1.5178561210632324, -1.3598743677139282, -1.201892614364624, -1.0439108610153198, -0.8859291076660156, -0.7279473543167114, -0.5699656009674072, -0.411983847618103, -0.25400257110595703, -0.09602081775665283, 0.06196093559265137, 0.21994268894195557, 0.37792444229125977, 0.535906195640564, 0.6938879489898682, 0.8518697023391724, 1.0098514556884766, 1.1678332090377808, 1.325814962387085, 1.4837967157363892, 1.6417784690856934, 1.7997602224349976, 1.9577419757843018, 2.1157236099243164, 2.27370548248291, 2.431687355041504, 2.5896689891815186, 2.747650623321533, 2.905632495880127, 3.0636143684387207, 3.2215960025787354, 3.37957763671875, 3.5375595092773438, 3.6955413818359375, 3.853523015975952, 4.011504650115967, 4.1694865226745605, 4.327468395233154, 4.48544979095459, 4.643431663513184, 4.801413536071777]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 13.0, 8.0, 9.0, 7.0, 13.0, 21.0, 34.0, 82.0, 260.0, 1243.0, 9365.0, 654588.0, 3512291.0, 13534.0, 2011.0, 478.0, 156.0, 60.0, 28.0, 18.0, 14.0, 8.0, 11.0, 5.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7890625, -1.729522705078125, -1.66998291015625, -1.610443115234375, -1.5509033203125, -1.491363525390625, -1.43182373046875, -1.372283935546875, -1.312744140625, -1.253204345703125, -1.19366455078125, -1.134124755859375, -1.0745849609375, -1.015045166015625, -0.95550537109375, -0.895965576171875, -0.83642578125, -0.776885986328125, -0.71734619140625, -0.657806396484375, -0.5982666015625, -0.538726806640625, -0.47918701171875, -0.419647216796875, -0.360107421875, -0.300567626953125, -0.24102783203125, -0.181488037109375, -0.1219482421875, -0.062408447265625, -0.00286865234375, 0.056671142578125, 0.1162109375, 0.175750732421875, 0.23529052734375, 0.294830322265625, 0.3543701171875, 0.413909912109375, 0.47344970703125, 0.532989501953125, 0.592529296875, 0.652069091796875, 0.71160888671875, 0.771148681640625, 0.8306884765625, 0.890228271484375, 0.94976806640625, 1.009307861328125, 1.06884765625, 1.128387451171875, 1.18792724609375, 1.247467041015625, 1.3070068359375, 1.366546630859375, 1.42608642578125, 1.485626220703125, 1.545166015625, 1.604705810546875, 1.66424560546875, 1.723785400390625, 1.7833251953125, 1.842864990234375, 1.90240478515625, 1.961944580078125, 2.021484375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 5.0, 8.0, 8.0, 16.0, 13.0, 10.0, 29.0, 58.0, 108.0, 169.0, 191.0, 150.0, 61.0, 55.0, 16.0, 11.0, 5.0, 5.0, 13.0, 12.0, 6.0, 3.0, 2.0, 4.0, 6.0, 3.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.034820556640625, -0.033509254455566406, -0.03219795227050781, -0.03088665008544922, -0.029575347900390625, -0.02826404571533203, -0.026952743530273438, -0.025641441345214844, -0.02433013916015625, -0.023018836975097656, -0.021707534790039062, -0.02039623260498047, -0.019084930419921875, -0.01777362823486328, -0.016462326049804688, -0.015151023864746094, -0.0138397216796875, -0.012528419494628906, -0.011217117309570312, -0.009905815124511719, -0.008594512939453125, -0.007283210754394531, -0.0059719085693359375, -0.004660606384277344, -0.00334930419921875, -0.0020380020141601562, -0.0007266998291015625, 0.0005846023559570312, 0.001895904541015625, 0.0032072067260742188, 0.0045185089111328125, 0.005829811096191406, 0.00714111328125, 0.008452415466308594, 0.009763717651367188, 0.011075019836425781, 0.012386322021484375, 0.013697624206542969, 0.015008926391601562, 0.016320228576660156, 0.01763153076171875, 0.018942832946777344, 0.020254135131835938, 0.02156543731689453, 0.022876739501953125, 0.02418804168701172, 0.025499343872070312, 0.026810646057128906, 0.0281219482421875, 0.029433250427246094, 0.030744552612304688, 0.03205585479736328, 0.033367156982421875, 0.03467845916748047, 0.03598976135253906, 0.037301063537597656, 0.03861236572265625, 0.039923667907714844, 0.04123497009277344, 0.04254627227783203, 0.043857574462890625, 0.04516887664794922, 0.04648017883300781, 0.047791481018066406, 0.049102783203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 7.0, 7.0, 12.0, 7.0, 18.0, 33.0, 33.0, 72.0, 81.0, 130.0, 180.0, 306.0, 601.0, 1145.0, 2458.0, 6579.0, 21231.0, 97273.0, 1304138.0, 2593578.0, 127856.0, 25318.0, 7466.0, 2806.0, 1278.0, 670.0, 354.0, 216.0, 132.0, 104.0, 56.0, 40.0, 27.0, 20.0, 12.0, 10.0, 12.0, 6.0, 4.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.441650390625, -0.4259223937988281, -0.41019439697265625, -0.3944664001464844, -0.3787384033203125, -0.3630104064941406, -0.34728240966796875, -0.3315544128417969, -0.315826416015625, -0.3000984191894531, -0.28437042236328125, -0.2686424255371094, -0.2529144287109375, -0.23718643188476562, -0.22145843505859375, -0.20573043823242188, -0.19000244140625, -0.17427444458007812, -0.15854644775390625, -0.14281845092773438, -0.1270904541015625, -0.11136245727539062, -0.09563446044921875, -0.07990646362304688, -0.064178466796875, -0.048450469970703125, -0.03272247314453125, -0.016994476318359375, -0.0012664794921875, 0.014461517333984375, 0.03018951416015625, 0.045917510986328125, 0.0616455078125, 0.07737350463867188, 0.09310150146484375, 0.10882949829101562, 0.1245574951171875, 0.14028549194335938, 0.15601348876953125, 0.17174148559570312, 0.187469482421875, 0.20319747924804688, 0.21892547607421875, 0.23465347290039062, 0.2503814697265625, 0.2661094665527344, 0.28183746337890625, 0.2975654602050781, 0.31329345703125, 0.3290214538574219, 0.34474945068359375, 0.3604774475097656, 0.3762054443359375, 0.3919334411621094, 0.40766143798828125, 0.4233894348144531, 0.439117431640625, 0.4548454284667969, 0.47057342529296875, 0.4863014221191406, 0.5020294189453125, 0.5177574157714844, 0.5334854125976562, 0.5492134094238281, 0.56494140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 13.0, 24.0, 15.0, 29.0, 39.0, 67.0, 97.0, 173.0, 337.0, 856.0, 1486.0, 475.0, 191.0, 92.0, 69.0, 23.0, 29.0, 14.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06597900390625, -0.06301498413085938, -0.06005096435546875, -0.057086944580078125, -0.0541229248046875, -0.051158905029296875, -0.04819488525390625, -0.045230865478515625, -0.042266845703125, -0.039302825927734375, -0.03633880615234375, -0.033374786376953125, -0.0304107666015625, -0.027446746826171875, -0.02448272705078125, -0.021518707275390625, -0.0185546875, -0.015590667724609375, -0.01262664794921875, -0.009662628173828125, -0.0066986083984375, -0.003734588623046875, -0.00077056884765625, 0.002193450927734375, 0.005157470703125, 0.008121490478515625, 0.01108551025390625, 0.014049530029296875, 0.0170135498046875, 0.019977569580078125, 0.02294158935546875, 0.025905609130859375, 0.02886962890625, 0.031833648681640625, 0.03479766845703125, 0.037761688232421875, 0.0407257080078125, 0.043689727783203125, 0.04665374755859375, 0.049617767333984375, 0.052581787109375, 0.055545806884765625, 0.05850982666015625, 0.061473846435546875, 0.0644378662109375, 0.06740188598632812, 0.07036590576171875, 0.07332992553710938, 0.0762939453125, 0.07925796508789062, 0.08222198486328125, 0.08518600463867188, 0.0881500244140625, 0.09111404418945312, 0.09407806396484375, 0.09704208374023438, 0.100006103515625, 0.10297012329101562, 0.10593414306640625, 0.10889816284179688, 0.1118621826171875, 0.11482620239257812, 0.11779022216796875, 0.12075424194335938, 0.12371826171875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 10.0, 9.0, 20.0, 57.0, 162.0, 391.0, 267.0, 58.0, 16.0, 9.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6056296825408936, -1.5581352710723877, -1.5106408596038818, -1.463146448135376, -1.4156520366668701, -1.3681575059890747, -1.3206630945205688, -1.273168683052063, -1.2256742715835571, -1.1781798601150513, -1.1306854486465454, -1.0831910371780396, -1.0356965065002441, -0.9882021546363831, -0.9407076835632324, -0.8932132720947266, -0.8457188606262207, -0.7982244491577148, -0.750730037689209, -0.7032355666160583, -0.6557411551475525, -0.6082467436790466, -0.560752272605896, -0.5132578611373901, -0.4657634496688843, -0.4182690382003784, -0.37077459692955017, -0.3232801556587219, -0.27578574419021606, -0.228291317820549, -0.18079689145088196, -0.1333024501800537, -0.08580803871154785, -0.0383136123418808, 0.009180814027786255, 0.05667524039745331, 0.10416966676712036, 0.15166409313678741, 0.19915851950645447, 0.24665296077728271, 0.2941473722457886, 0.34164178371429443, 0.3891362249851227, 0.4366306662559509, 0.4841250777244568, 0.5316194891929626, 0.5791139602661133, 0.6266083717346191, 0.674102783203125, 0.7215971946716309, 0.7690916061401367, 0.8165860772132874, 0.8640804886817932, 0.9115749001502991, 0.9590693712234497, 1.0065637826919556, 1.0540581941604614, 1.1015526056289673, 1.1490470170974731, 1.196541428565979, 1.2440359592437744, 1.2915303707122803, 1.3390247821807861, 1.386519193649292, 1.4340136051177979]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 14.0, 14.0, 19.0, 17.0, 18.0, 33.0, 32.0, 50.0, 52.0, 68.0, 74.0, 82.0, 82.0, 69.0, 64.0, 74.0, 59.0, 40.0, 38.0, 22.0, 15.0, 21.0, 18.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6058225631713867, -0.5881983637809753, -0.5705742239952087, -0.5529500246047974, -0.5353258848190308, -0.5177016854286194, -0.5000775456428528, -0.4824533462524414, -0.4648291766643524, -0.4472050070762634, -0.42958083748817444, -0.41195666790008545, -0.3943324685096741, -0.37670832872390747, -0.3590841293334961, -0.3414599597454071, -0.3238357901573181, -0.3062116205692291, -0.28858745098114014, -0.27096328139305115, -0.25333911180496216, -0.23571492731571198, -0.2180907428264618, -0.2004665732383728, -0.1828424036502838, -0.16521823406219482, -0.14759406447410583, -0.12996987998485565, -0.11234571039676666, -0.09472154080867767, -0.07709736377000809, -0.0594731867313385, -0.04184907674789429, -0.024224903434515, -0.006600730121135712, 0.011023443192243576, 0.028647616505622864, 0.04627178609371185, 0.06389596313238144, 0.08152014017105103, 0.09914430975914001, 0.116768479347229, 0.134392648935318, 0.15201683342456818, 0.16964100301265717, 0.18726517260074615, 0.20488935708999634, 0.22251352667808533, 0.24013769626617432, 0.2577618658542633, 0.2753860354423523, 0.2930102050304413, 0.3106343746185303, 0.32825857400894165, 0.34588274359703064, 0.36350691318511963, 0.3811310827732086, 0.3987552523612976, 0.4163794219493866, 0.4340035915374756, 0.45162779092788696, 0.46925193071365356, 0.48687613010406494, 0.5045002698898315, 0.5221244692802429]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 13.0, 12.0, 10.0, 19.0, 16.0, 31.0, 41.0, 60.0, 108.0, 200.0, 432.0, 1133.0, 3974.0, 21125.0, 364981.0, 620383.0, 28594.0, 4945.0, 1377.0, 502.0, 192.0, 120.0, 51.0, 41.0, 40.0, 29.0, 21.0, 13.0, 8.0, 7.0, 13.0, 8.0, 10.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8408203125, -0.814605712890625, -0.78839111328125, -0.762176513671875, -0.7359619140625, -0.709747314453125, -0.68353271484375, -0.657318115234375, -0.631103515625, -0.604888916015625, -0.57867431640625, -0.552459716796875, -0.5262451171875, -0.500030517578125, -0.47381591796875, -0.447601318359375, -0.42138671875, -0.395172119140625, -0.36895751953125, -0.342742919921875, -0.3165283203125, -0.290313720703125, -0.26409912109375, -0.237884521484375, -0.211669921875, -0.185455322265625, -0.15924072265625, -0.133026123046875, -0.1068115234375, -0.080596923828125, -0.05438232421875, -0.028167724609375, -0.001953125, 0.024261474609375, 0.05047607421875, 0.076690673828125, 0.1029052734375, 0.129119873046875, 0.15533447265625, 0.181549072265625, 0.207763671875, 0.233978271484375, 0.26019287109375, 0.286407470703125, 0.3126220703125, 0.338836669921875, 0.36505126953125, 0.391265869140625, 0.41748046875, 0.443695068359375, 0.46990966796875, 0.496124267578125, 0.5223388671875, 0.548553466796875, 0.57476806640625, 0.600982666015625, 0.627197265625, 0.653411865234375, 0.67962646484375, 0.705841064453125, 0.7320556640625, 0.758270263671875, 0.78448486328125, 0.810699462890625, 0.8369140625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 15.0, 28.0, 49.0, 76.0, 136.0, 203.0, 194.0, 117.0, 81.0, 37.0, 20.0, 13.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.1181640625, -0.11569547653198242, -0.11322689056396484, -0.11075830459594727, -0.10828971862792969, -0.10582113265991211, -0.10335254669189453, -0.10088396072387695, -0.09841537475585938, -0.0959467887878418, -0.09347820281982422, -0.09100961685180664, -0.08854103088378906, -0.08607244491577148, -0.0836038589477539, -0.08113527297973633, -0.07866668701171875, -0.07619810104370117, -0.0737295150756836, -0.07126092910766602, -0.06879234313964844, -0.06632375717163086, -0.06385517120361328, -0.0613865852355957, -0.058917999267578125, -0.05644941329956055, -0.05398082733154297, -0.05151224136352539, -0.04904365539550781, -0.046575069427490234, -0.044106483459472656, -0.04163789749145508, -0.0391693115234375, -0.03670072555541992, -0.034232139587402344, -0.031763553619384766, -0.029294967651367188, -0.02682638168334961, -0.02435779571533203, -0.021889209747314453, -0.019420623779296875, -0.016952037811279297, -0.014483451843261719, -0.01201486587524414, -0.009546279907226562, -0.007077693939208984, -0.004609107971191406, -0.002140522003173828, 0.00032806396484375, 0.002796649932861328, 0.005265235900878906, 0.007733821868896484, 0.010202407836914062, 0.01267099380493164, 0.015139579772949219, 0.017608165740966797, 0.020076751708984375, 0.022545337677001953, 0.02501392364501953, 0.02748250961303711, 0.029951095581054688, 0.032419681549072266, 0.034888267517089844, 0.03735685348510742, 0.039825439453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 10.0, 6.0, 6.0, 7.0, 12.0, 30.0, 87.0, 472.0, 7848.0, 791643.0, 244937.0, 2999.0, 312.0, 76.0, 25.0, 15.0, 3.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.1943359375, -1.1529541015625, -1.111572265625, -1.0701904296875, -1.02880859375, -0.9874267578125, -0.946044921875, -0.9046630859375, -0.86328125, -0.8218994140625, -0.780517578125, -0.7391357421875, -0.69775390625, -0.6563720703125, -0.614990234375, -0.5736083984375, -0.5322265625, -0.4908447265625, -0.449462890625, -0.4080810546875, -0.36669921875, -0.3253173828125, -0.283935546875, -0.2425537109375, -0.201171875, -0.1597900390625, -0.118408203125, -0.0770263671875, -0.03564453125, 0.0057373046875, 0.047119140625, 0.0885009765625, 0.1298828125, 0.1712646484375, 0.212646484375, 0.2540283203125, 0.29541015625, 0.3367919921875, 0.378173828125, 0.4195556640625, 0.4609375, 0.5023193359375, 0.543701171875, 0.5850830078125, 0.62646484375, 0.6678466796875, 0.709228515625, 0.7506103515625, 0.7919921875, 0.8333740234375, 0.874755859375, 0.9161376953125, 0.95751953125, 0.9989013671875, 1.040283203125, 1.0816650390625, 1.123046875, 1.1644287109375, 1.205810546875, 1.2471923828125, 1.28857421875, 1.3299560546875, 1.371337890625, 1.4127197265625, 1.4541015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 5.0, 7.0, 8.0, 15.0, 11.0, 12.0, 19.0, 22.0, 20.0, 20.0, 32.0, 33.0, 33.0, 33.0, 40.0, 42.0, 33.0, 36.0, 51.0, 46.0, 46.0, 39.0, 34.0, 47.0, 34.0, 33.0, 36.0, 33.0, 26.0, 22.0, 17.0, 21.0, 10.0, 15.0, 13.0, 10.0, 13.0, 6.0, 5.0, 10.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1451416015625, -0.14005470275878906, -0.13496780395507812, -0.1298809051513672, -0.12479400634765625, -0.11970710754394531, -0.11462020874023438, -0.10953330993652344, -0.1044464111328125, -0.09935951232910156, -0.09427261352539062, -0.08918571472167969, -0.08409881591796875, -0.07901191711425781, -0.07392501831054688, -0.06883811950683594, -0.063751220703125, -0.05866432189941406, -0.053577423095703125, -0.04849052429199219, -0.04340362548828125, -0.03831672668457031, -0.033229827880859375, -0.028142929077148438, -0.0230560302734375, -0.017969131469726562, -0.012882232666015625, -0.0077953338623046875, -0.00270843505859375, 0.0023784637451171875, 0.007465362548828125, 0.012552261352539062, 0.01763916015625, 0.022726058959960938, 0.027812957763671875, 0.03289985656738281, 0.03798675537109375, 0.04307365417480469, 0.048160552978515625, 0.05324745178222656, 0.0583343505859375, 0.06342124938964844, 0.06850814819335938, 0.07359504699707031, 0.07868194580078125, 0.08376884460449219, 0.08885574340820312, 0.09394264221191406, 0.099029541015625, 0.10411643981933594, 0.10920333862304688, 0.11429023742675781, 0.11937713623046875, 0.12446403503417969, 0.12955093383789062, 0.13463783264160156, 0.1397247314453125, 0.14481163024902344, 0.14989852905273438, 0.1549854278564453, 0.16007232666015625, 0.1651592254638672, 0.17024612426757812, 0.17533302307128906, 0.180419921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 15.0, 34.0, 127.0, 1855.0, 1044700.0, 1604.0, 119.0, 42.0, 19.0, 11.0, 8.0, 3.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.16796875, -6.84906005859375, -6.5301513671875, -6.21124267578125, -5.892333984375, -5.57342529296875, -5.2545166015625, -4.93560791015625, -4.61669921875, -4.29779052734375, -3.9788818359375, -3.65997314453125, -3.341064453125, -3.02215576171875, -2.7032470703125, -2.38433837890625, -2.0654296875, -1.74652099609375, -1.4276123046875, -1.10870361328125, -0.789794921875, -0.47088623046875, -0.1519775390625, 0.16693115234375, 0.48583984375, 0.80474853515625, 1.1236572265625, 1.44256591796875, 1.761474609375, 2.08038330078125, 2.3992919921875, 2.71820068359375, 3.037109375, 3.35601806640625, 3.6749267578125, 3.99383544921875, 4.312744140625, 4.63165283203125, 4.9505615234375, 5.26947021484375, 5.58837890625, 5.90728759765625, 6.2261962890625, 6.54510498046875, 6.864013671875, 7.18292236328125, 7.5018310546875, 7.82073974609375, 8.1396484375, 8.45855712890625, 8.7774658203125, 9.09637451171875, 9.415283203125, 9.73419189453125, 10.0531005859375, 10.37200927734375, 10.69091796875, 11.00982666015625, 11.3287353515625, 11.64764404296875, 11.966552734375, 12.28546142578125, 12.6043701171875, 12.92327880859375, 13.2421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 8.0, 10.0, 19.0, 27.0, 22.0, 36.0, 55.0, 65.0, 121.0, 129.0, 147.0, 89.0, 87.0, 53.0, 32.0, 27.0, 18.0, 12.0, 10.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.064508438110352e-05, -7.841922342777252e-05, -7.619336247444153e-05, -7.396750152111053e-05, -7.174164056777954e-05, -6.951577961444855e-05, -6.728991866111755e-05, -6.506405770778656e-05, -6.283819675445557e-05, -6.061233580112457e-05, -5.838647484779358e-05, -5.6160613894462585e-05, -5.393475294113159e-05, -5.17088919878006e-05, -4.9483031034469604e-05, -4.725717008113861e-05, -4.503130912780762e-05, -4.2805448174476624e-05, -4.057958722114563e-05, -3.8353726267814636e-05, -3.612786531448364e-05, -3.390200436115265e-05, -3.1676143407821655e-05, -2.945028245449066e-05, -2.7224421501159668e-05, -2.4998560547828674e-05, -2.277269959449768e-05, -2.0546838641166687e-05, -1.8320977687835693e-05, -1.60951167345047e-05, -1.3869255781173706e-05, -1.1643394827842712e-05, -9.417533874511719e-06, -7.191672921180725e-06, -4.9658119678497314e-06, -2.739951014518738e-06, -5.140900611877441e-07, 1.7117708921432495e-06, 3.937631845474243e-06, 6.163492798805237e-06, 8.38935375213623e-06, 1.0615214705467224e-05, 1.2841075658798218e-05, 1.5066936612129211e-05, 1.7292797565460205e-05, 1.95186585187912e-05, 2.1744519472122192e-05, 2.3970380425453186e-05, 2.619624137878418e-05, 2.8422102332115173e-05, 3.064796328544617e-05, 3.287382423877716e-05, 3.5099685192108154e-05, 3.732554614543915e-05, 3.955140709877014e-05, 4.1777268052101135e-05, 4.400312900543213e-05, 4.622898995876312e-05, 4.8454850912094116e-05, 5.068071186542511e-05, 5.2906572818756104e-05, 5.51324337720871e-05, 5.735829472541809e-05, 5.9584155678749084e-05, 6.181001663208008e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 11.0, 12.0, 13.0, 24.0, 39.0, 77.0, 84.0, 173.0, 240.0, 567.0, 1027.0, 2899.0, 9040.0, 47778.0, 896184.0, 73264.0, 11442.0, 3223.0, 1214.0, 539.0, 289.0, 164.0, 92.0, 40.0, 44.0, 27.0, 16.0, 10.0, 6.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.775390625, -1.7281494140625, -1.680908203125, -1.6336669921875, -1.58642578125, -1.5391845703125, -1.491943359375, -1.4447021484375, -1.3974609375, -1.3502197265625, -1.302978515625, -1.2557373046875, -1.20849609375, -1.1612548828125, -1.114013671875, -1.0667724609375, -1.01953125, -0.9722900390625, -0.925048828125, -0.8778076171875, -0.83056640625, -0.7833251953125, -0.736083984375, -0.6888427734375, -0.6416015625, -0.5943603515625, -0.547119140625, -0.4998779296875, -0.45263671875, -0.4053955078125, -0.358154296875, -0.3109130859375, -0.263671875, -0.2164306640625, -0.169189453125, -0.1219482421875, -0.07470703125, -0.0274658203125, 0.019775390625, 0.0670166015625, 0.1142578125, 0.1614990234375, 0.208740234375, 0.2559814453125, 0.30322265625, 0.3504638671875, 0.397705078125, 0.4449462890625, 0.4921875, 0.5394287109375, 0.586669921875, 0.6339111328125, 0.68115234375, 0.7283935546875, 0.775634765625, 0.8228759765625, 0.8701171875, 0.9173583984375, 0.964599609375, 1.0118408203125, 1.05908203125, 1.1063232421875, 1.153564453125, 1.2008056640625, 1.248046875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 4.0, 6.0, 10.0, 13.0, 13.0, 30.0, 44.0, 105.0, 213.0, 252.0, 135.0, 51.0, 28.0, 22.0, 8.0, 14.0, 14.0, 10.0, 3.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9831161499023438, -0.9535369873046875, -0.9239578247070312, -0.894378662109375, -0.8647994995117188, -0.8352203369140625, -0.8056411743164062, -0.77606201171875, -0.7464828491210938, -0.7169036865234375, -0.6873245239257812, -0.657745361328125, -0.6281661987304688, -0.5985870361328125, -0.5690078735351562, -0.5394287109375, -0.5098495483398438, -0.4802703857421875, -0.45069122314453125, -0.421112060546875, -0.39153289794921875, -0.3619537353515625, -0.33237457275390625, -0.30279541015625, -0.27321624755859375, -0.2436370849609375, -0.21405792236328125, -0.184478759765625, -0.15489959716796875, -0.1253204345703125, -0.09574127197265625, -0.066162109375, -0.03658294677734375, -0.0070037841796875, 0.02257537841796875, 0.052154541015625, 0.08173370361328125, 0.1113128662109375, 0.14089202880859375, 0.17047119140625, 0.20005035400390625, 0.2296295166015625, 0.25920867919921875, 0.288787841796875, 0.31836700439453125, 0.3479461669921875, 0.37752532958984375, 0.4071044921875, 0.43668365478515625, 0.4662628173828125, 0.49584197998046875, 0.525421142578125, 0.5550003051757812, 0.5845794677734375, 0.6141586303710938, 0.64373779296875, 0.6733169555664062, 0.7028961181640625, 0.7324752807617188, 0.762054443359375, 0.7916336059570312, 0.8212127685546875, 0.8507919311523438, 0.88037109375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 12.0, 16.0, 28.0, 78.0, 168.0, 213.0, 242.0, 108.0, 60.0, 31.0, 16.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.424810886383057, -5.306727409362793, -5.188643932342529, -5.070559978485107, -4.952476501464844, -4.83439302444458, -4.716309547424316, -4.598226070404053, -4.480142593383789, -4.362059116363525, -4.243975639343262, -4.12589168548584, -4.007808208465576, -3.8897247314453125, -3.771641254425049, -3.653557777404785, -3.5354738235473633, -3.4173903465270996, -3.299306631088257, -3.181223154067993, -3.0631394386291504, -2.9450559616088867, -2.826972484588623, -2.7088890075683594, -2.5908052921295166, -2.472721815109253, -2.35463809967041, -2.2365546226501465, -2.118471145629883, -2.00038743019104, -1.8823039531707764, -1.7642203569412231, -1.646136999130249, -1.5280534029006958, -1.4099698066711426, -1.291886329650879, -1.1738027334213257, -1.0557191371917725, -0.937635600566864, -0.8195520639419556, -0.7014684677124023, -0.5833848714828491, -0.4653013348579407, -0.34721776843070984, -0.229134202003479, -0.11105060577392578, 0.007032930850982666, 0.1251164674758911, 0.24320006370544434, 0.36128363013267517, 0.479367196559906, 0.5974507331848145, 0.7155343294143677, 0.8336179256439209, 0.9517014622688293, 1.0697849988937378, 1.187868595123291, 1.3059521913528442, 1.4240357875823975, 1.5421192646026611, 1.6602028608322144, 1.7782864570617676, 1.8963699340820312, 2.014453411102295, 2.1325371265411377]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 7.0, 16.0, 23.0, 34.0, 36.0, 42.0, 61.0, 64.0, 79.0, 81.0, 85.0, 86.0, 70.0, 63.0, 45.0, 49.0, 40.0, 27.0, 19.0, 19.0, 9.0, 10.0, 2.0, 3.0, 7.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.428568124771118, -2.3419911861419678, -2.2554140090942383, -2.168837070465088, -2.0822601318359375, -1.995682954788208, -1.9091060161590576, -1.8225289583206177, -1.7359519004821777, -1.6493748426437378, -1.5627977848052979, -1.4762208461761475, -1.3896437883377075, -1.3030667304992676, -1.2164897918701172, -1.1299127340316772, -1.0433356761932373, -0.9567586183547974, -0.8701816201210022, -0.783604621887207, -0.6970275640487671, -0.6104505062103271, -0.523873507976532, -0.4372965097427368, -0.3507194519042969, -0.2641424238681793, -0.17756539583206177, -0.09098836779594421, -0.00441133975982666, 0.0821656882762909, 0.16874271631240845, 0.2553197145462036, 0.34189653396606445, 0.428473562002182, 0.5150505900382996, 0.6016275882720947, 0.6882046461105347, 0.7747817039489746, 0.8613587021827698, 0.9479357004165649, 1.0345127582550049, 1.1210898160934448, 1.2076668739318848, 1.2942438125610352, 1.380820870399475, 1.467397928237915, 1.5539748668670654, 1.6405519247055054, 1.7271289825439453, 1.8137060403823853, 1.9002830982208252, 1.9868600368499756, 2.073437213897705, 2.1600141525268555, 2.246591091156006, 2.3331680297851562, 2.4197452068328857, 2.506322145462036, 2.5928993225097656, 2.679476261138916, 2.7660531997680664, 2.852630376815796, 2.9392073154449463, 3.025784492492676, 3.112361431121826]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 7.0, 13.0, 19.0, 22.0, 35.0, 47.0, 59.0, 66.0, 101.0, 115.0, 191.0, 276.0, 535.0, 906.0, 1633.0, 3404.0, 9100.0, 33407.0, 747845.0, 3329821.0, 46385.0, 11405.0, 4423.0, 1922.0, 1040.0, 573.0, 338.0, 215.0, 126.0, 69.0, 48.0, 31.0, 24.0, 19.0, 14.0, 8.0, 9.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 5.0, 0.0, 4.0, 1.0], "bins": [-1.12109375, -1.09002685546875, -1.0589599609375, -1.02789306640625, -0.996826171875, -0.96575927734375, -0.9346923828125, -0.90362548828125, -0.87255859375, -0.84149169921875, -0.8104248046875, -0.77935791015625, -0.748291015625, -0.71722412109375, -0.6861572265625, -0.65509033203125, -0.6240234375, -0.59295654296875, -0.5618896484375, -0.53082275390625, -0.499755859375, -0.46868896484375, -0.4376220703125, -0.40655517578125, -0.37548828125, -0.34442138671875, -0.3133544921875, -0.28228759765625, -0.251220703125, -0.22015380859375, -0.1890869140625, -0.15802001953125, -0.126953125, -0.09588623046875, -0.0648193359375, -0.03375244140625, -0.002685546875, 0.02838134765625, 0.0594482421875, 0.09051513671875, 0.12158203125, 0.15264892578125, 0.1837158203125, 0.21478271484375, 0.245849609375, 0.27691650390625, 0.3079833984375, 0.33905029296875, 0.3701171875, 0.40118408203125, 0.4322509765625, 0.46331787109375, 0.494384765625, 0.52545166015625, 0.5565185546875, 0.58758544921875, 0.61865234375, 0.64971923828125, 0.6807861328125, 0.71185302734375, 0.742919921875, 0.77398681640625, 0.8050537109375, 0.83612060546875, 0.8671875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 10.0, 6.0, 7.0, 13.0, 11.0, 29.0, 33.0, 56.0, 59.0, 102.0, 121.0, 114.0, 102.0, 84.0, 58.0, 46.0, 42.0, 23.0, 21.0, 18.0, 11.0, 5.0, 8.0, 7.0, 7.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054595947265625, -0.05306053161621094, -0.051525115966796875, -0.04998970031738281, -0.04845428466796875, -0.04691886901855469, -0.045383453369140625, -0.04384803771972656, -0.0423126220703125, -0.04077720642089844, -0.039241790771484375, -0.03770637512207031, -0.03617095947265625, -0.03463554382324219, -0.033100128173828125, -0.03156471252441406, -0.030029296875, -0.028493881225585938, -0.026958465576171875, -0.025423049926757812, -0.02388763427734375, -0.022352218627929688, -0.020816802978515625, -0.019281387329101562, -0.0177459716796875, -0.016210556030273438, -0.014675140380859375, -0.013139724731445312, -0.01160430908203125, -0.010068893432617188, -0.008533477783203125, -0.0069980621337890625, -0.005462646484375, -0.0039272308349609375, -0.002391815185546875, -0.0008563995361328125, 0.00067901611328125, 0.0022144317626953125, 0.003749847412109375, 0.0052852630615234375, 0.0068206787109375, 0.008356094360351562, 0.009891510009765625, 0.011426925659179688, 0.01296234130859375, 0.014497756958007812, 0.016033172607421875, 0.017568588256835938, 0.01910400390625, 0.020639419555664062, 0.022174835205078125, 0.023710250854492188, 0.02524566650390625, 0.026781082153320312, 0.028316497802734375, 0.029851913452148438, 0.0313873291015625, 0.03292274475097656, 0.034458160400390625, 0.03599357604980469, 0.03752899169921875, 0.03906440734863281, 0.040599822998046875, 0.04213523864746094, 0.043670654296875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 1.0, 5.0, 12.0, 11.0, 8.0, 19.0, 11.0, 26.0, 28.0, 57.0, 125.0, 313.0, 1183.0, 8582.0, 253006.0, 3894634.0, 32441.0, 2819.0, 550.0, 192.0, 76.0, 41.0, 44.0, 19.0, 11.0, 14.0, 14.0, 7.0, 7.0, 4.0, 2.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.875, -1.8246612548828125, -1.774322509765625, -1.7239837646484375, -1.67364501953125, -1.6233062744140625, -1.572967529296875, -1.5226287841796875, -1.4722900390625, -1.4219512939453125, -1.371612548828125, -1.3212738037109375, -1.27093505859375, -1.2205963134765625, -1.170257568359375, -1.1199188232421875, -1.069580078125, -1.0192413330078125, -0.968902587890625, -0.9185638427734375, -0.86822509765625, -0.8178863525390625, -0.767547607421875, -0.7172088623046875, -0.6668701171875, -0.6165313720703125, -0.566192626953125, -0.5158538818359375, -0.46551513671875, -0.4151763916015625, -0.364837646484375, -0.3144989013671875, -0.26416015625, -0.2138214111328125, -0.163482666015625, -0.1131439208984375, -0.06280517578125, -0.0124664306640625, 0.037872314453125, 0.0882110595703125, 0.1385498046875, 0.1888885498046875, 0.239227294921875, 0.2895660400390625, 0.33990478515625, 0.3902435302734375, 0.440582275390625, 0.4909210205078125, 0.541259765625, 0.5915985107421875, 0.641937255859375, 0.6922760009765625, 0.74261474609375, 0.7929534912109375, 0.843292236328125, 0.8936309814453125, 0.9439697265625, 0.9943084716796875, 1.044647216796875, 1.0949859619140625, 1.14532470703125, 1.1956634521484375, 1.246002197265625, 1.2963409423828125, 1.3466796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 3.0, 8.0, 13.0, 18.0, 18.0, 24.0, 42.0, 53.0, 92.0, 131.0, 254.0, 661.0, 1392.0, 633.0, 294.0, 168.0, 71.0, 62.0, 32.0, 22.0, 18.0, 13.0, 8.0, 9.0, 5.0, 1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07427978515625, -0.07125282287597656, -0.06822586059570312, -0.06519889831542969, -0.06217193603515625, -0.05914497375488281, -0.056118011474609375, -0.05309104919433594, -0.0500640869140625, -0.04703712463378906, -0.044010162353515625, -0.04098320007324219, -0.03795623779296875, -0.03492927551269531, -0.031902313232421875, -0.028875350952148438, -0.025848388671875, -0.022821426391601562, -0.019794464111328125, -0.016767501831054688, -0.01374053955078125, -0.010713577270507812, -0.007686614990234375, -0.0046596527099609375, -0.0016326904296875, 0.0013942718505859375, 0.004421234130859375, 0.0074481964111328125, 0.01047515869140625, 0.013502120971679688, 0.016529083251953125, 0.019556045532226562, 0.0225830078125, 0.025609970092773438, 0.028636932373046875, 0.03166389465332031, 0.03469085693359375, 0.03771781921386719, 0.040744781494140625, 0.04377174377441406, 0.0467987060546875, 0.04982566833496094, 0.052852630615234375, 0.05587959289550781, 0.05890655517578125, 0.06193351745605469, 0.06496047973632812, 0.06798744201660156, 0.071014404296875, 0.07404136657714844, 0.07706832885742188, 0.08009529113769531, 0.08312225341796875, 0.08614921569824219, 0.08917617797851562, 0.09220314025878906, 0.0952301025390625, 0.09825706481933594, 0.10128402709960938, 0.10431098937988281, 0.10733795166015625, 0.11036491394042969, 0.11339187622070312, 0.11641883850097656, 0.11944580078125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 18.0, 245.0, 529.0, 147.0, 43.0, 8.0, 8.0, 3.0, 1.0], "bins": [-4.585784435272217, -4.505848407745361, -4.425912380218506, -4.34597635269165, -4.266040802001953, -4.186104774475098, -4.106168746948242, -4.026232719421387, -3.9462966918945312, -3.866360664367676, -3.7864246368408203, -3.706488847732544, -3.6265528202056885, -3.546616792678833, -3.4666810035705566, -3.386744976043701, -3.3068089485168457, -3.2268729209899902, -3.1469368934631348, -3.0670011043548584, -2.987065076828003, -2.9071290493011475, -2.827193260192871, -2.7472572326660156, -2.66732120513916, -2.5873851776123047, -2.507449150085449, -2.427513360977173, -2.3475773334503174, -2.267641305923462, -2.1877055168151855, -2.10776948928833, -2.0278334617614746, -1.9478974342346191, -1.8679615259170532, -1.7880256175994873, -1.7080895900726318, -1.6281535625457764, -1.5482176542282104, -1.4682817459106445, -1.388345718383789, -1.3084096908569336, -1.2284737825393677, -1.1485378742218018, -1.0686018466949463, -0.9886658787727356, -0.9087299108505249, -0.8287939429283142, -0.7488580346107483, -0.6689220666885376, -0.5889860987663269, -0.5090501308441162, -0.4291141629219055, -0.3491781949996948, -0.26924222707748413, -0.18930625915527344, -0.10937029123306274, -0.02943432331085205, 0.05050164461135864, 0.13043761253356934, 0.21037358045578003, 0.2903095483779907, 0.3702455163002014, 0.4501814842224121, 0.5301174521446228]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 13.0, 17.0, 20.0, 50.0, 61.0, 78.0, 83.0, 105.0, 134.0, 90.0, 81.0, 79.0, 55.0, 48.0, 32.0, 18.0, 12.0, 9.0, 6.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.3663687705993652, -1.3385528326034546, -1.310736894607544, -1.2829209566116333, -1.2551050186157227, -1.2272891998291016, -1.1994731426239014, -1.1716573238372803, -1.1438413858413696, -1.116025447845459, -1.0882095098495483, -1.0603935718536377, -1.032577633857727, -1.0047616958618164, -0.9769458174705505, -0.9491298794746399, -0.9213139414787292, -0.8934980034828186, -0.865682065486908, -0.8378661870956421, -0.8100502490997314, -0.7822343111038208, -0.7544183731079102, -0.7266024351119995, -0.6987864971160889, -0.6709705591201782, -0.6431546211242676, -0.6153386831283569, -0.5875228047370911, -0.5597068667411804, -0.5318909287452698, -0.5040749907493591, -0.47625917196273804, -0.4484432339668274, -0.42062732577323914, -0.3928113877773285, -0.36499547958374023, -0.3371795415878296, -0.30936360359191895, -0.2815476655960083, -0.25373175740242004, -0.2259158343076706, -0.19809991121292114, -0.1702839732170105, -0.14246805012226105, -0.1146521270275116, -0.08683618903160095, -0.0590202659368515, -0.03120434284210205, -0.0033884160220623016, 0.024427510797977448, 0.052243441343307495, 0.08005936443805695, 0.1078752875328064, 0.13569122552871704, 0.1635071486234665, 0.19132307171821594, 0.2191389948129654, 0.24695491790771484, 0.2747708559036255, 0.30258679389953613, 0.3304027020931244, 0.35821864008903503, 0.3860345482826233, 0.41385048627853394]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 12.0, 13.0, 17.0, 19.0, 20.0, 30.0, 43.0, 38.0, 50.0, 49.0, 56.0, 61.0, 604.0, 201236.0, 844680.0, 1182.0, 87.0, 48.0, 39.0, 41.0, 39.0, 26.0, 24.0, 32.0, 22.0, 13.0, 13.0, 7.0, 9.0, 10.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.6328125, -2.54534912109375, -2.4578857421875, -2.37042236328125, -2.282958984375, -2.19549560546875, -2.1080322265625, -2.02056884765625, -1.93310546875, -1.84564208984375, -1.7581787109375, -1.67071533203125, -1.583251953125, -1.49578857421875, -1.4083251953125, -1.32086181640625, -1.2333984375, -1.14593505859375, -1.0584716796875, -0.97100830078125, -0.883544921875, -0.79608154296875, -0.7086181640625, -0.62115478515625, -0.53369140625, -0.44622802734375, -0.3587646484375, -0.27130126953125, -0.183837890625, -0.09637451171875, -0.0089111328125, 0.07855224609375, 0.166015625, 0.25347900390625, 0.3409423828125, 0.42840576171875, 0.515869140625, 0.60333251953125, 0.6907958984375, 0.77825927734375, 0.86572265625, 0.95318603515625, 1.0406494140625, 1.12811279296875, 1.215576171875, 1.30303955078125, 1.3905029296875, 1.47796630859375, 1.5654296875, 1.65289306640625, 1.7403564453125, 1.82781982421875, 1.915283203125, 2.00274658203125, 2.0902099609375, 2.17767333984375, 2.26513671875, 2.35260009765625, 2.4400634765625, 2.52752685546875, 2.614990234375, 2.70245361328125, 2.7899169921875, 2.87738037109375, 2.96484375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 16.0, 74.0, 257.0, 356.0, 224.0, 62.0, 17.0, 4.0, 1.0, 2.0], "bins": [-0.36865234375, -0.3622255325317383, -0.35579872131347656, -0.34937191009521484, -0.3429450988769531, -0.3365182876586914, -0.3300914764404297, -0.32366466522216797, -0.31723785400390625, -0.31081104278564453, -0.3043842315673828, -0.2979574203491211, -0.2915306091308594, -0.28510379791259766, -0.27867698669433594, -0.2722501754760742, -0.2658233642578125, -0.2593965530395508, -0.25296974182128906, -0.24654293060302734, -0.24011611938476562, -0.2336893081665039, -0.2272624969482422, -0.22083568572998047, -0.21440887451171875, -0.20798206329345703, -0.2015552520751953, -0.1951284408569336, -0.18870162963867188, -0.18227481842041016, -0.17584800720214844, -0.16942119598388672, -0.162994384765625, -0.15656757354736328, -0.15014076232910156, -0.14371395111083984, -0.13728713989257812, -0.1308603286743164, -0.12443351745605469, -0.11800670623779297, -0.11157989501953125, -0.10515308380126953, -0.09872627258300781, -0.0922994613647461, -0.08587265014648438, -0.07944583892822266, -0.07301902770996094, -0.06659221649169922, -0.0601654052734375, -0.05373859405517578, -0.04731178283691406, -0.040884971618652344, -0.034458160400390625, -0.028031349182128906, -0.021604537963867188, -0.015177726745605469, -0.00875091552734375, -0.0023241043090820312, 0.0041027069091796875, 0.010529518127441406, 0.016956329345703125, 0.023383140563964844, 0.029809951782226562, 0.03623676300048828, 0.04266357421875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 8.0, 15.0, 21.0, 27.0, 34.0, 54.0, 101.0, 163.0, 307.0, 705.0, 1779.0, 5795.0, 24837.0, 165652.0, 622193.0, 189517.0, 27701.0, 6169.0, 1923.0, 748.0, 370.0, 180.0, 90.0, 50.0, 34.0, 23.0, 15.0, 13.0, 4.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.79296875, -0.7706527709960938, -0.7483367919921875, -0.7260208129882812, -0.703704833984375, -0.6813888549804688, -0.6590728759765625, -0.6367568969726562, -0.61444091796875, -0.5921249389648438, -0.5698089599609375, -0.5474929809570312, -0.525177001953125, -0.5028610229492188, -0.4805450439453125, -0.45822906494140625, -0.4359130859375, -0.41359710693359375, -0.3912811279296875, -0.36896514892578125, -0.346649169921875, -0.32433319091796875, -0.3020172119140625, -0.27970123291015625, -0.25738525390625, -0.23506927490234375, -0.2127532958984375, -0.19043731689453125, -0.168121337890625, -0.14580535888671875, -0.1234893798828125, -0.10117340087890625, -0.078857421875, -0.05654144287109375, -0.0342254638671875, -0.01190948486328125, 0.010406494140625, 0.03272247314453125, 0.0550384521484375, 0.07735443115234375, 0.09967041015625, 0.12198638916015625, 0.1443023681640625, 0.16661834716796875, 0.188934326171875, 0.21125030517578125, 0.2335662841796875, 0.25588226318359375, 0.2781982421875, 0.30051422119140625, 0.3228302001953125, 0.34514617919921875, 0.367462158203125, 0.38977813720703125, 0.4120941162109375, 0.43441009521484375, 0.45672607421875, 0.47904205322265625, 0.5013580322265625, 0.5236740112304688, 0.545989990234375, 0.5683059692382812, 0.5906219482421875, 0.6129379272460938, 0.63525390625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 11.0, 7.0, 6.0, 11.0, 12.0, 19.0, 13.0, 19.0, 20.0, 26.0, 36.0, 49.0, 40.0, 42.0, 37.0, 45.0, 51.0, 45.0, 61.0, 51.0, 59.0, 41.0, 48.0, 31.0, 38.0, 31.0, 26.0, 23.0, 20.0, 16.0, 15.0, 9.0, 9.0, 7.0, 4.0, 3.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.314697265625, -0.3054008483886719, -0.29610443115234375, -0.2868080139160156, -0.2775115966796875, -0.2682151794433594, -0.25891876220703125, -0.24962234497070312, -0.240325927734375, -0.23102951049804688, -0.22173309326171875, -0.21243667602539062, -0.2031402587890625, -0.19384384155273438, -0.18454742431640625, -0.17525100708007812, -0.16595458984375, -0.15665817260742188, -0.14736175537109375, -0.13806533813476562, -0.1287689208984375, -0.11947250366210938, -0.11017608642578125, -0.10087966918945312, -0.091583251953125, -0.08228683471679688, -0.07299041748046875, -0.06369400024414062, -0.0543975830078125, -0.045101165771484375, -0.03580474853515625, -0.026508331298828125, -0.0172119140625, -0.007915496826171875, 0.00138092041015625, 0.010677337646484375, 0.0199737548828125, 0.029270172119140625, 0.03856658935546875, 0.047863006591796875, 0.057159423828125, 0.06645584106445312, 0.07575225830078125, 0.08504867553710938, 0.0943450927734375, 0.10364151000976562, 0.11293792724609375, 0.12223434448242188, 0.13153076171875, 0.14082717895507812, 0.15012359619140625, 0.15942001342773438, 0.1687164306640625, 0.17801284790039062, 0.18730926513671875, 0.19660568237304688, 0.205902099609375, 0.21519851684570312, 0.22449493408203125, 0.23379135131835938, 0.2430877685546875, 0.2523841857910156, 0.26168060302734375, 0.2709770202636719, 0.2802734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 6.0, 6.0, 10.0, 5.0, 19.0, 18.0, 30.0, 44.0, 60.0, 84.0, 146.0, 176.0, 323.0, 573.0, 1032.0, 2257.0, 5781.0, 18391.0, 83155.0, 412102.0, 411744.0, 83603.0, 18371.0, 5731.0, 2377.0, 1087.0, 550.0, 281.0, 174.0, 134.0, 96.0, 46.0, 36.0, 28.0, 19.0, 12.0, 9.0, 13.0, 5.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.556640625, -0.5419921875, -0.52734375, -0.5126953125, -0.498046875, -0.4833984375, -0.46875, -0.4541015625, -0.439453125, -0.4248046875, -0.41015625, -0.3955078125, -0.380859375, -0.3662109375, -0.3515625, -0.3369140625, -0.322265625, -0.3076171875, -0.29296875, -0.2783203125, -0.263671875, -0.2490234375, -0.234375, -0.2197265625, -0.205078125, -0.1904296875, -0.17578125, -0.1611328125, -0.146484375, -0.1318359375, -0.1171875, -0.1025390625, -0.087890625, -0.0732421875, -0.05859375, -0.0439453125, -0.029296875, -0.0146484375, 0.0, 0.0146484375, 0.029296875, 0.0439453125, 0.05859375, 0.0732421875, 0.087890625, 0.1025390625, 0.1171875, 0.1318359375, 0.146484375, 0.1611328125, 0.17578125, 0.1904296875, 0.205078125, 0.2197265625, 0.234375, 0.2490234375, 0.263671875, 0.2783203125, 0.29296875, 0.3076171875, 0.322265625, 0.3369140625, 0.3515625, 0.3662109375, 0.380859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 6.0, 2.0, 4.0, 9.0, 9.0, 13.0, 18.0, 36.0, 39.0, 60.0, 108.0, 109.0, 149.0, 123.0, 88.0, 78.0, 50.0, 31.0, 16.0, 14.0, 12.0, 10.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010305643081665039, -0.00010038074105978012, -9.770505130290985e-05, -9.502936154603958e-05, -9.235367178916931e-05, -8.967798203229904e-05, -8.700229227542877e-05, -8.43266025185585e-05, -8.165091276168823e-05, -7.897522300481796e-05, -7.629953324794769e-05, -7.362384349107742e-05, -7.094815373420715e-05, -6.827246397733688e-05, -6.559677422046661e-05, -6.292108446359634e-05, -6.0245394706726074e-05, -5.7569704949855804e-05, -5.4894015192985535e-05, -5.2218325436115265e-05, -4.9542635679244995e-05, -4.6866945922374725e-05, -4.4191256165504456e-05, -4.1515566408634186e-05, -3.8839876651763916e-05, -3.6164186894893646e-05, -3.3488497138023376e-05, -3.081280738115311e-05, -2.8137117624282837e-05, -2.5461427867412567e-05, -2.2785738110542297e-05, -2.0110048353672028e-05, -1.7434358596801758e-05, -1.4758668839931488e-05, -1.2082979083061218e-05, -9.407289326190948e-06, -6.731599569320679e-06, -4.055909812450409e-06, -1.3802200555801392e-06, 1.2954697012901306e-06, 3.9711594581604e-06, 6.64684921503067e-06, 9.32253897190094e-06, 1.199822872877121e-05, 1.467391848564148e-05, 1.734960824251175e-05, 2.002529799938202e-05, 2.270098775625229e-05, 2.537667751312256e-05, 2.805236726999283e-05, 3.07280570268631e-05, 3.340374678373337e-05, 3.607943654060364e-05, 3.875512629747391e-05, 4.143081605434418e-05, 4.410650581121445e-05, 4.678219556808472e-05, 4.9457885324954987e-05, 5.2133575081825256e-05, 5.4809264838695526e-05, 5.7484954595565796e-05, 6.0160644352436066e-05, 6.283633410930634e-05, 6.55120238661766e-05, 6.818771362304688e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 10.0, 15.0, 13.0, 26.0, 46.0, 69.0, 124.0, 221.0, 379.0, 956.0, 2553.0, 9792.0, 91500.0, 837106.0, 91716.0, 9581.0, 2611.0, 918.0, 391.0, 216.0, 115.0, 71.0, 50.0, 23.0, 21.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.125, -1.0923919677734375, -1.059783935546875, -1.0271759033203125, -0.99456787109375, -0.9619598388671875, -0.929351806640625, -0.8967437744140625, -0.8641357421875, -0.8315277099609375, -0.798919677734375, -0.7663116455078125, -0.73370361328125, -0.7010955810546875, -0.668487548828125, -0.6358795166015625, -0.603271484375, -0.5706634521484375, -0.538055419921875, -0.5054473876953125, -0.47283935546875, -0.4402313232421875, -0.407623291015625, -0.3750152587890625, -0.3424072265625, -0.3097991943359375, -0.277191162109375, -0.2445831298828125, -0.21197509765625, -0.1793670654296875, -0.146759033203125, -0.1141510009765625, -0.08154296875, -0.0489349365234375, -0.016326904296875, 0.0162811279296875, 0.04888916015625, 0.0814971923828125, 0.114105224609375, 0.1467132568359375, 0.1793212890625, 0.2119293212890625, 0.244537353515625, 0.2771453857421875, 0.30975341796875, 0.3423614501953125, 0.374969482421875, 0.4075775146484375, 0.440185546875, 0.4727935791015625, 0.505401611328125, 0.5380096435546875, 0.57061767578125, 0.6032257080078125, 0.635833740234375, 0.6684417724609375, 0.7010498046875, 0.7336578369140625, 0.766265869140625, 0.7988739013671875, 0.83148193359375, 0.8640899658203125, 0.896697998046875, 0.9293060302734375, 0.9619140625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 12.0, 13.0, 35.0, 77.0, 128.0, 187.0, 192.0, 149.0, 91.0, 53.0, 27.0, 15.0, 9.0, 5.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.6266517639160156, -0.6107254028320312, -0.5947990417480469, -0.5788726806640625, -0.5629463195800781, -0.5470199584960938, -0.5310935974121094, -0.515167236328125, -0.4992408752441406, -0.48331451416015625, -0.4673881530761719, -0.4514617919921875, -0.4355354309082031, -0.41960906982421875, -0.4036827087402344, -0.38775634765625, -0.3718299865722656, -0.35590362548828125, -0.3399772644042969, -0.3240509033203125, -0.3081245422363281, -0.29219818115234375, -0.2762718200683594, -0.260345458984375, -0.24441909790039062, -0.22849273681640625, -0.21256637573242188, -0.1966400146484375, -0.18071365356445312, -0.16478729248046875, -0.14886093139648438, -0.1329345703125, -0.11700820922851562, -0.10108184814453125, -0.08515548706054688, -0.0692291259765625, -0.053302764892578125, -0.03737640380859375, -0.021450042724609375, -0.005523681640625, 0.010402679443359375, 0.02632904052734375, 0.042255401611328125, 0.0581817626953125, 0.07410812377929688, 0.09003448486328125, 0.10596084594726562, 0.12188720703125, 0.13781356811523438, 0.15373992919921875, 0.16966629028320312, 0.1855926513671875, 0.20151901245117188, 0.21744537353515625, 0.23337173461914062, 0.249298095703125, 0.2652244567871094, 0.28115081787109375, 0.2970771789550781, 0.3130035400390625, 0.3289299011230469, 0.34485626220703125, 0.3607826232910156, 0.376708984375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 19.0, 68.0, 250.0, 356.0, 190.0, 79.0, 23.0, 7.0, 9.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.066506385803223, -3.8166847229003906, -3.5668630599975586, -3.3170413970947266, -3.0672199726104736, -2.8173983097076416, -2.5675766468048096, -2.3177552223205566, -2.0679335594177246, -1.8181118965148926, -1.56829035282135, -1.318468689918518, -1.0686471462249756, -0.8188254833221436, -0.5690038204193115, -0.31918227672576904, -0.06936049461364746, 0.180461123585701, 0.43028274178504944, 0.6801043748855591, 0.9299259781837463, 1.1797475814819336, 1.4295692443847656, 1.679390788078308, 1.9292124509811401, 2.1790339946746826, 2.4288556575775146, 2.6786773204803467, 2.9284989833831787, 3.1783204078674316, 3.4281420707702637, 3.6779637336730957, 3.9277853965759277, 4.17760705947876, 4.427428722381592, 4.677250385284424, 4.927072048187256, 5.17689323425293, 5.426714897155762, 5.676536560058594, 5.926358222961426, 6.176179885864258, 6.42600154876709, 6.675823211669922, 6.925644874572754, 7.175466537475586, 7.425288200378418, 7.675109386444092, 7.924931526184082, 8.174753189086914, 8.424574851989746, 8.674396514892578, 8.92421817779541, 9.174039840698242, 9.423861503601074, 9.673683166503906, 9.923503875732422, 10.173325538635254, 10.423147201538086, 10.672968864440918, 10.92279052734375, 11.172612190246582, 11.422433853149414, 11.672255516052246, 11.922077178955078]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 4.0, 1.0, 2.0, 7.0, 8.0, 11.0, 14.0, 21.0, 28.0, 23.0, 38.0, 29.0, 44.0, 40.0, 44.0, 45.0, 53.0, 66.0, 59.0, 59.0, 53.0, 51.0, 51.0, 43.0, 33.0, 38.0, 25.0, 27.0, 15.0, 25.0, 17.0, 8.0, 7.0, 9.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.217620849609375, -2.146178960800171, -2.074737071990967, -2.003295421600342, -1.9318535327911377, -1.8604116439819336, -1.7889697551727295, -1.7175278663635254, -1.6460860967636108, -1.5746442079544067, -1.5032024383544922, -1.431760549545288, -1.360318660736084, -1.2888768911361694, -1.2174350023269653, -1.1459932327270508, -1.0745513439178467, -1.0031094551086426, -0.931667685508728, -0.8602257966995239, -0.7887839674949646, -0.7173421382904053, -0.6459002494812012, -0.5744584202766418, -0.5030165910720825, -0.4315747618675232, -0.3601329028606415, -0.28869104385375977, -0.21724921464920044, -0.1458073854446411, -0.0743655264377594, -0.0029236674308776855, 0.06851816177368164, 0.13996000587940216, 0.21140184998512268, 0.2828437089920044, 0.3542855381965637, 0.42572736740112305, 0.49716922640800476, 0.5686110854148865, 0.6400529146194458, 0.7114947438240051, 0.7829365730285645, 0.8543784618377686, 0.9258202910423279, 0.9972621202468872, 1.0687040090560913, 1.1401457786560059, 1.21158766746521, 1.283029556274414, 1.3544713258743286, 1.4259132146835327, 1.4973549842834473, 1.5687968730926514, 1.6402387619018555, 1.7116806507110596, 1.7831224203109741, 1.8545643091201782, 1.9260060787200928, 1.9974479675292969, 2.068889856338501, 2.140331745147705, 2.21177339553833, 2.283215284347534, 2.3546571731567383]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 7.0, 9.0, 14.0, 22.0, 32.0, 60.0, 82.0, 120.0, 226.0, 474.0, 14112.0, 4177800.0, 1107.0, 139.0, 62.0, 14.0, 7.0, 3.0, 3.0], "bins": [-14.96875, -14.70281982421875, -14.4368896484375, -14.17095947265625, -13.905029296875, -13.63909912109375, -13.3731689453125, -13.10723876953125, -12.84130859375, -12.57537841796875, -12.3094482421875, -12.04351806640625, -11.777587890625, -11.51165771484375, -11.2457275390625, -10.97979736328125, -10.7138671875, -10.44793701171875, -10.1820068359375, -9.91607666015625, -9.650146484375, -9.38421630859375, -9.1182861328125, -8.85235595703125, -8.58642578125, -8.32049560546875, -8.0545654296875, -7.78863525390625, -7.522705078125, -7.25677490234375, -6.9908447265625, -6.72491455078125, -6.458984375, -6.19305419921875, -5.9271240234375, -5.66119384765625, -5.395263671875, -5.12933349609375, -4.8634033203125, -4.59747314453125, -4.33154296875, -4.06561279296875, -3.7996826171875, -3.53375244140625, -3.267822265625, -3.00189208984375, -2.7359619140625, -2.47003173828125, -2.2041015625, -1.93817138671875, -1.6722412109375, -1.40631103515625, -1.140380859375, -0.87445068359375, -0.6085205078125, -0.34259033203125, -0.07666015625, 0.18927001953125, 0.4552001953125, 0.72113037109375, 0.987060546875, 1.25299072265625, 1.5189208984375, 1.78485107421875, 2.05078125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 9.0, 28.0, 63.0, 154.0, 210.0, 235.0, 156.0, 85.0, 50.0, 8.0, 8.0, 1.0, 4.0], "bins": [-0.373046875, -0.3663954734802246, -0.3597440719604492, -0.35309267044067383, -0.34644126892089844, -0.33978986740112305, -0.33313846588134766, -0.32648706436157227, -0.3198356628417969, -0.3131842613220215, -0.3065328598022461, -0.2998814582824707, -0.2932300567626953, -0.2865786552429199, -0.27992725372314453, -0.27327585220336914, -0.26662445068359375, -0.25997304916381836, -0.25332164764404297, -0.24667024612426758, -0.2400188446044922, -0.2333674430847168, -0.2267160415649414, -0.22006464004516602, -0.21341323852539062, -0.20676183700561523, -0.20011043548583984, -0.19345903396606445, -0.18680763244628906, -0.18015623092651367, -0.17350482940673828, -0.1668534278869629, -0.1602020263671875, -0.1535506248474121, -0.14689922332763672, -0.14024782180786133, -0.13359642028808594, -0.12694501876831055, -0.12029361724853516, -0.11364221572875977, -0.10699081420898438, -0.10033941268920898, -0.0936880111694336, -0.0870366096496582, -0.08038520812988281, -0.07373380661010742, -0.06708240509033203, -0.06043100357055664, -0.05377960205078125, -0.04712820053100586, -0.04047679901123047, -0.03382539749145508, -0.027173995971679688, -0.020522594451904297, -0.013871192932128906, -0.007219791412353516, -0.000568389892578125, 0.006083011627197266, 0.012734413146972656, 0.019385814666748047, 0.026037216186523438, 0.03268861770629883, 0.03934001922607422, 0.04599142074584961, 0.052642822265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 9.0, 6.0, 15.0, 14.0, 28.0, 49.0, 42.0, 64.0, 120.0, 171.0, 272.0, 1264.0, 202102.0, 3986110.0, 2882.0, 483.0, 216.0, 149.0, 95.0, 58.0, 40.0, 36.0, 15.0, 15.0, 9.0, 6.0, 11.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.859375, -8.658538818359375, -8.45770263671875, -8.256866455078125, -8.0560302734375, -7.855194091796875, -7.65435791015625, -7.453521728515625, -7.252685546875, -7.051849365234375, -6.85101318359375, -6.650177001953125, -6.4493408203125, -6.248504638671875, -6.04766845703125, -5.846832275390625, -5.64599609375, -5.445159912109375, -5.24432373046875, -5.043487548828125, -4.8426513671875, -4.641815185546875, -4.44097900390625, -4.240142822265625, -4.039306640625, -3.838470458984375, -3.63763427734375, -3.436798095703125, -3.2359619140625, -3.035125732421875, -2.83428955078125, -2.633453369140625, -2.4326171875, -2.231781005859375, -2.03094482421875, -1.830108642578125, -1.6292724609375, -1.428436279296875, -1.22760009765625, -1.026763916015625, -0.825927734375, -0.625091552734375, -0.42425537109375, -0.223419189453125, -0.0225830078125, 0.178253173828125, 0.37908935546875, 0.579925537109375, 0.78076171875, 0.981597900390625, 1.18243408203125, 1.383270263671875, 1.5841064453125, 1.784942626953125, 1.98577880859375, 2.186614990234375, 2.387451171875, 2.588287353515625, 2.78912353515625, 2.989959716796875, 3.1907958984375, 3.391632080078125, 3.59246826171875, 3.793304443359375, 3.994140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 58.0, 217.0, 2496.0, 1014.0, 168.0, 65.0, 23.0, 17.0, 8.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57568359375, -0.556396484375, -0.537109375, -0.517822265625, -0.49853515625, -0.479248046875, -0.4599609375, -0.440673828125, -0.42138671875, -0.402099609375, -0.3828125, -0.363525390625, -0.34423828125, -0.324951171875, -0.3056640625, -0.286376953125, -0.26708984375, -0.247802734375, -0.228515625, -0.209228515625, -0.18994140625, -0.170654296875, -0.1513671875, -0.132080078125, -0.11279296875, -0.093505859375, -0.07421875, -0.054931640625, -0.03564453125, -0.016357421875, 0.0029296875, 0.022216796875, 0.04150390625, 0.060791015625, 0.080078125, 0.099365234375, 0.11865234375, 0.137939453125, 0.1572265625, 0.176513671875, 0.19580078125, 0.215087890625, 0.234375, 0.253662109375, 0.27294921875, 0.292236328125, 0.3115234375, 0.330810546875, 0.35009765625, 0.369384765625, 0.388671875, 0.407958984375, 0.42724609375, 0.446533203125, 0.4658203125, 0.485107421875, 0.50439453125, 0.523681640625, 0.54296875, 0.562255859375, 0.58154296875, 0.600830078125, 0.6201171875, 0.639404296875, 0.65869140625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 12.0, 24.0, 86.0, 252.0, 373.0, 178.0, 42.0, 13.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1140847206115723, -2.952277660369873, -2.790470600128174, -2.6286633014678955, -2.4668562412261963, -2.305049180984497, -2.1432418823242188, -1.9814348220825195, -1.8196277618408203, -1.657820701599121, -1.4960135221481323, -1.3342063426971436, -1.1723992824554443, -1.0105922222137451, -0.8487850427627563, -0.6869778633117676, -0.5251708030700684, -0.36336368322372437, -0.20155656337738037, -0.03974944353103638, 0.12205767631530762, 0.2838647961616516, 0.4456719160079956, 0.6074790954589844, 0.7692861557006836, 0.9310932755470276, 1.0929003953933716, 1.2547075748443604, 1.4165146350860596, 1.5783216953277588, 1.7401288747787476, 1.9019360542297363, 2.0637435913085938, 2.225550651550293, 2.387357711791992, 2.5491650104522705, 2.7109720706939697, 2.872779130935669, 3.0345864295959473, 3.1963934898376465, 3.3582005500793457, 3.520007610321045, 3.681814670562744, 3.8436219692230225, 4.005429267883301, 4.167236328125, 4.329043388366699, 4.490850448608398, 4.652657508850098, 4.814464569091797, 4.976271629333496, 5.138078689575195, 5.2998857498168945, 5.461693286895752, 5.623500347137451, 5.78530740737915, 5.94711446762085, 6.108921527862549, 6.270728588104248, 6.432535648345947, 6.594343185424805, 6.756150245666504, 6.917957305908203, 7.079764366149902, 7.241571426391602]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 17.0, 24.0, 16.0, 31.0, 35.0, 42.0, 54.0, 64.0, 62.0, 75.0, 72.0, 74.0, 64.0, 66.0, 49.0, 51.0, 47.0, 45.0, 26.0, 21.0, 16.0, 12.0, 10.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380401849746704, -1.3349392414093018, -1.2894765138626099, -1.2440139055252075, -1.1985511779785156, -1.1530885696411133, -1.107625961303711, -1.062163233757019, -1.0167005062103271, -0.97123783826828, -0.9257751703262329, -0.8803125619888306, -0.8348498344421387, -0.7893872261047363, -0.7439245581626892, -0.6984618902206421, -0.6529992818832397, -0.6075366139411926, -0.5620739459991455, -0.5166113376617432, -0.47114863991737366, -0.42568597197532654, -0.3802233338356018, -0.3347606658935547, -0.28929799795150757, -0.24383533000946045, -0.19837267696857452, -0.1529100239276886, -0.10744735598564148, -0.06198468804359436, -0.01652204990386963, 0.02894061803817749, 0.07440328598022461, 0.11986594647169113, 0.16532860696315765, 0.21079126000404358, 0.2562539279460907, 0.3017165958881378, 0.34717923402786255, 0.39264190196990967, 0.4381045699119568, 0.4835672378540039, 0.529029905796051, 0.5744925737380981, 0.6199551820755005, 0.6654179096221924, 0.7108805179595947, 0.7563431859016418, 0.801805853843689, 0.8472685217857361, 0.8927311897277832, 0.9381937980651855, 0.9836565256118774, 1.0291191339492798, 1.0745818614959717, 1.120044469833374, 1.1655070781707764, 1.2109696865081787, 1.2564324140548706, 1.301895022392273, 1.3473577499389648, 1.3928203582763672, 1.4382829666137695, 1.4837456941604614, 1.5292084217071533]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 6.0, 12.0, 4.0, 13.0, 31.0, 26.0, 39.0, 58.0, 105.0, 206.0, 694.0, 4768.0, 166775.0, 854547.0, 18932.0, 1585.0, 359.0, 118.0, 71.0, 51.0, 35.0, 40.0, 29.0, 11.0, 9.0, 4.0, 8.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.8203125, -2.72705078125, -2.6337890625, -2.54052734375, -2.447265625, -2.35400390625, -2.2607421875, -2.16748046875, -2.07421875, -1.98095703125, -1.8876953125, -1.79443359375, -1.701171875, -1.60791015625, -1.5146484375, -1.42138671875, -1.328125, -1.23486328125, -1.1416015625, -1.04833984375, -0.955078125, -0.86181640625, -0.7685546875, -0.67529296875, -0.58203125, -0.48876953125, -0.3955078125, -0.30224609375, -0.208984375, -0.11572265625, -0.0224609375, 0.07080078125, 0.1640625, 0.25732421875, 0.3505859375, 0.44384765625, 0.537109375, 0.63037109375, 0.7236328125, 0.81689453125, 0.91015625, 1.00341796875, 1.0966796875, 1.18994140625, 1.283203125, 1.37646484375, 1.4697265625, 1.56298828125, 1.65625, 1.74951171875, 1.8427734375, 1.93603515625, 2.029296875, 2.12255859375, 2.2158203125, 2.30908203125, 2.40234375, 2.49560546875, 2.5888671875, 2.68212890625, 2.775390625, 2.86865234375, 2.9619140625, 3.05517578125, 3.1484375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 19.0, 66.0, 108.0, 186.0, 205.0, 212.0, 111.0, 65.0, 24.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39599609375, -0.3876628875732422, -0.3793296813964844, -0.37099647521972656, -0.36266326904296875, -0.35433006286621094, -0.3459968566894531, -0.3376636505126953, -0.3293304443359375, -0.3209972381591797, -0.3126640319824219, -0.30433082580566406, -0.29599761962890625, -0.28766441345214844, -0.2793312072753906, -0.2709980010986328, -0.262664794921875, -0.2543315887451172, -0.24599838256835938, -0.23766517639160156, -0.22933197021484375, -0.22099876403808594, -0.21266555786132812, -0.2043323516845703, -0.1959991455078125, -0.1876659393310547, -0.17933273315429688, -0.17099952697753906, -0.16266632080078125, -0.15433311462402344, -0.14599990844726562, -0.1376667022705078, -0.12933349609375, -0.12100028991699219, -0.11266708374023438, -0.10433387756347656, -0.09600067138671875, -0.08766746520996094, -0.07933425903320312, -0.07100105285644531, -0.0626678466796875, -0.05433464050292969, -0.046001434326171875, -0.03766822814941406, -0.02933502197265625, -0.021001815795898438, -0.012668609619140625, -0.0043354034423828125, 0.003997802734375, 0.012331008911132812, 0.020664215087890625, 0.028997421264648438, 0.03733062744140625, 0.04566383361816406, 0.053997039794921875, 0.06233024597167969, 0.0706634521484375, 0.07899665832519531, 0.08732986450195312, 0.09566307067871094, 0.10399627685546875, 0.11232948303222656, 0.12066268920898438, 0.1289958953857422, 0.1373291015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 9.0, 10.0, 6.0, 11.0, 17.0, 20.0, 31.0, 23.0, 47.0, 41.0, 79.0, 141.0, 190.0, 323.0, 527.0, 1109.0, 2520.0, 7633.0, 31246.0, 171401.0, 564230.0, 216419.0, 38059.0, 8921.0, 2869.0, 1172.0, 567.0, 321.0, 213.0, 108.0, 79.0, 58.0, 46.0, 26.0, 21.0, 23.0, 13.0, 16.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.837890625, -0.81292724609375, -0.7879638671875, -0.76300048828125, -0.738037109375, -0.71307373046875, -0.6881103515625, -0.66314697265625, -0.63818359375, -0.61322021484375, -0.5882568359375, -0.56329345703125, -0.538330078125, -0.51336669921875, -0.4884033203125, -0.46343994140625, -0.4384765625, -0.41351318359375, -0.3885498046875, -0.36358642578125, -0.338623046875, -0.31365966796875, -0.2886962890625, -0.26373291015625, -0.23876953125, -0.21380615234375, -0.1888427734375, -0.16387939453125, -0.138916015625, -0.11395263671875, -0.0889892578125, -0.06402587890625, -0.0390625, -0.01409912109375, 0.0108642578125, 0.03582763671875, 0.060791015625, 0.08575439453125, 0.1107177734375, 0.13568115234375, 0.16064453125, 0.18560791015625, 0.2105712890625, 0.23553466796875, 0.260498046875, 0.28546142578125, 0.3104248046875, 0.33538818359375, 0.3603515625, 0.38531494140625, 0.4102783203125, 0.43524169921875, 0.460205078125, 0.48516845703125, 0.5101318359375, 0.53509521484375, 0.56005859375, 0.58502197265625, 0.6099853515625, 0.63494873046875, 0.659912109375, 0.68487548828125, 0.7098388671875, 0.73480224609375, 0.759765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 3.0, 8.0, 8.0, 9.0, 10.0, 12.0, 11.0, 6.0, 28.0, 30.0, 40.0, 32.0, 40.0, 48.0, 63.0, 36.0, 52.0, 38.0, 59.0, 52.0, 49.0, 49.0, 41.0, 32.0, 38.0, 34.0, 26.0, 15.0, 24.0, 22.0, 14.0, 12.0, 9.0, 12.0, 5.0, 4.0, 6.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.4345703125, -0.422210693359375, -0.40985107421875, -0.397491455078125, -0.3851318359375, -0.372772216796875, -0.36041259765625, -0.348052978515625, -0.335693359375, -0.323333740234375, -0.31097412109375, -0.298614501953125, -0.2862548828125, -0.273895263671875, -0.26153564453125, -0.249176025390625, -0.23681640625, -0.224456787109375, -0.21209716796875, -0.199737548828125, -0.1873779296875, -0.175018310546875, -0.16265869140625, -0.150299072265625, -0.137939453125, -0.125579833984375, -0.11322021484375, -0.100860595703125, -0.0885009765625, -0.076141357421875, -0.06378173828125, -0.051422119140625, -0.0390625, -0.026702880859375, -0.01434326171875, -0.001983642578125, 0.0103759765625, 0.022735595703125, 0.03509521484375, 0.047454833984375, 0.059814453125, 0.072174072265625, 0.08453369140625, 0.096893310546875, 0.1092529296875, 0.121612548828125, 0.13397216796875, 0.146331787109375, 0.15869140625, 0.171051025390625, 0.18341064453125, 0.195770263671875, 0.2081298828125, 0.220489501953125, 0.23284912109375, 0.245208740234375, 0.257568359375, 0.269927978515625, 0.28228759765625, 0.294647216796875, 0.3070068359375, 0.319366455078125, 0.33172607421875, 0.344085693359375, 0.3564453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 4.0, 1.0, 5.0, 4.0, 10.0, 10.0, 18.0, 38.0, 33.0, 68.0, 118.0, 237.0, 493.0, 1407.0, 7410.0, 116903.0, 886979.0, 29389.0, 3751.0, 903.0, 341.0, 164.0, 104.0, 63.0, 33.0, 26.0, 14.0, 8.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6416015625, -1.5951080322265625, -1.548614501953125, -1.5021209716796875, -1.45562744140625, -1.4091339111328125, -1.362640380859375, -1.3161468505859375, -1.2696533203125, -1.2231597900390625, -1.176666259765625, -1.1301727294921875, -1.08367919921875, -1.0371856689453125, -0.990692138671875, -0.9441986083984375, -0.897705078125, -0.8512115478515625, -0.804718017578125, -0.7582244873046875, -0.71173095703125, -0.6652374267578125, -0.618743896484375, -0.5722503662109375, -0.5257568359375, -0.4792633056640625, -0.432769775390625, -0.3862762451171875, -0.33978271484375, -0.2932891845703125, -0.246795654296875, -0.2003021240234375, -0.15380859375, -0.1073150634765625, -0.060821533203125, -0.0143280029296875, 0.03216552734375, 0.0786590576171875, 0.125152587890625, 0.1716461181640625, 0.2181396484375, 0.2646331787109375, 0.311126708984375, 0.3576202392578125, 0.40411376953125, 0.4506072998046875, 0.497100830078125, 0.5435943603515625, 0.590087890625, 0.6365814208984375, 0.683074951171875, 0.7295684814453125, 0.77606201171875, 0.8225555419921875, 0.869049072265625, 0.9155426025390625, 0.9620361328125, 1.0085296630859375, 1.055023193359375, 1.1015167236328125, 1.14801025390625, 1.1945037841796875, 1.240997314453125, 1.2874908447265625, 1.333984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 13.0, 15.0, 29.0, 33.0, 44.0, 102.0, 161.0, 191.0, 164.0, 116.0, 59.0, 23.0, 17.0, 11.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012600421905517578, -0.00012107379734516144, -0.0001161433756351471, -0.00011121295392513275, -0.00010628253221511841, -0.00010135211050510406, -9.642168879508972e-05, -9.149126708507538e-05, -8.656084537506104e-05, -8.163042366504669e-05, -7.670000195503235e-05, -7.1769580245018e-05, -6.683915853500366e-05, -6.190873682498932e-05, -5.6978315114974976e-05, -5.204789340496063e-05, -4.711747169494629e-05, -4.2187049984931946e-05, -3.72566282749176e-05, -3.232620656490326e-05, -2.7395784854888916e-05, -2.2465363144874573e-05, -1.753494143486023e-05, -1.2604519724845886e-05, -7.674098014831543e-06, -2.7436763048171997e-06, 2.1867454051971436e-06, 7.117167115211487e-06, 1.204758882522583e-05, 1.6978010535240173e-05, 2.1908432245254517e-05, 2.683885395526886e-05, 3.17692756652832e-05, 3.6699697375297546e-05, 4.163011908531189e-05, 4.656054079532623e-05, 5.1490962505340576e-05, 5.642138421535492e-05, 6.135180592536926e-05, 6.62822276353836e-05, 7.121264934539795e-05, 7.614307105541229e-05, 8.107349276542664e-05, 8.600391447544098e-05, 9.093433618545532e-05, 9.586475789546967e-05, 0.00010079517960548401, 0.00010572560131549835, 0.0001106560230255127, 0.00011558644473552704, 0.00012051686644554138, 0.00012544728815555573, 0.00013037770986557007, 0.0001353081315755844, 0.00014023855328559875, 0.0001451689749956131, 0.00015009939670562744, 0.00015502981841564178, 0.00015996024012565613, 0.00016489066183567047, 0.00016982108354568481, 0.00017475150525569916, 0.0001796819269657135, 0.00018461234867572784, 0.0001895427703857422]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 8.0, 10.0, 23.0, 34.0, 49.0, 68.0, 151.0, 320.0, 806.0, 2764.0, 13564.0, 212739.0, 772559.0, 37612.0, 5510.0, 1411.0, 478.0, 187.0, 91.0, 57.0, 28.0, 18.0, 7.0, 12.0, 14.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.421875, -1.3846893310546875, -1.347503662109375, -1.3103179931640625, -1.27313232421875, -1.2359466552734375, -1.198760986328125, -1.1615753173828125, -1.1243896484375, -1.0872039794921875, -1.050018310546875, -1.0128326416015625, -0.97564697265625, -0.9384613037109375, -0.901275634765625, -0.8640899658203125, -0.826904296875, -0.7897186279296875, -0.752532958984375, -0.7153472900390625, -0.67816162109375, -0.6409759521484375, -0.603790283203125, -0.5666046142578125, -0.5294189453125, -0.4922332763671875, -0.455047607421875, -0.4178619384765625, -0.38067626953125, -0.3434906005859375, -0.306304931640625, -0.2691192626953125, -0.23193359375, -0.1947479248046875, -0.157562255859375, -0.1203765869140625, -0.08319091796875, -0.0460052490234375, -0.008819580078125, 0.0283660888671875, 0.0655517578125, 0.1027374267578125, 0.139923095703125, 0.1771087646484375, 0.21429443359375, 0.2514801025390625, 0.288665771484375, 0.3258514404296875, 0.363037109375, 0.4002227783203125, 0.437408447265625, 0.4745941162109375, 0.51177978515625, 0.5489654541015625, 0.586151123046875, 0.6233367919921875, 0.6605224609375, 0.6977081298828125, 0.734893798828125, 0.7720794677734375, 0.80926513671875, 0.8464508056640625, 0.883636474609375, 0.9208221435546875, 0.9580078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 9.0, 0.0, 3.0, 2.0, 2.0, 6.0, 6.0, 10.0, 18.0, 46.0, 58.0, 86.0, 149.0, 157.0, 143.0, 107.0, 65.0, 51.0, 29.0, 16.0, 11.0, 7.0, 3.0, 4.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.65234375, -0.6367225646972656, -0.6211013793945312, -0.6054801940917969, -0.5898590087890625, -0.5742378234863281, -0.5586166381835938, -0.5429954528808594, -0.527374267578125, -0.5117530822753906, -0.49613189697265625, -0.4805107116699219, -0.4648895263671875, -0.4492683410644531, -0.43364715576171875, -0.4180259704589844, -0.40240478515625, -0.3867835998535156, -0.37116241455078125, -0.3555412292480469, -0.3399200439453125, -0.3242988586425781, -0.30867767333984375, -0.2930564880371094, -0.277435302734375, -0.2618141174316406, -0.24619293212890625, -0.23057174682617188, -0.2149505615234375, -0.19932937622070312, -0.18370819091796875, -0.16808700561523438, -0.1524658203125, -0.13684463500976562, -0.12122344970703125, -0.10560226440429688, -0.0899810791015625, -0.07435989379882812, -0.05873870849609375, -0.043117523193359375, -0.027496337890625, -0.011875152587890625, 0.00374603271484375, 0.019367218017578125, 0.0349884033203125, 0.050609588623046875, 0.06623077392578125, 0.08185195922851562, 0.09747314453125, 0.11309432983398438, 0.12871551513671875, 0.14433670043945312, 0.1599578857421875, 0.17557907104492188, 0.19120025634765625, 0.20682144165039062, 0.222442626953125, 0.23806381225585938, 0.25368499755859375, 0.2693061828613281, 0.2849273681640625, 0.3005485534667969, 0.31616973876953125, 0.3317909240722656, 0.347412109375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 166.0, 696.0, 125.0, 16.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.394973754882812, -12.669388771057129, -11.943802833557129, -11.218217849731445, -10.492631912231445, -9.767046928405762, -9.041461944580078, -8.315876007080078, -7.5902910232543945, -6.864705562591553, -6.139120101928711, -5.413535118103027, -4.6879496574401855, -3.9623641967773438, -3.23677921295166, -2.5111937522888184, -1.7856082916259766, -1.0600229501724243, -0.33443760871887207, 0.3911476135253906, 1.1167330741882324, 1.8423185348510742, 2.567903518676758, 3.2934889793395996, 4.019074440002441, 4.744659900665283, 5.470245361328125, 6.195830345153809, 6.92141580581665, 7.647001266479492, 8.372586250305176, 9.09817123413086, 9.82375717163086, 10.549342155456543, 11.274928092956543, 12.000513076782227, 12.726099014282227, 13.45168399810791, 14.177268981933594, 14.902854919433594, 15.628439903259277, 16.35402488708496, 17.07961082458496, 17.805194854736328, 18.530780792236328, 19.256366729736328, 19.981952667236328, 20.707536697387695, 21.433122634887695, 22.158708572387695, 22.884292602539062, 23.609878540039062, 24.335464477539062, 25.061050415039062, 25.78663444519043, 26.51222038269043, 27.237804412841797, 27.963390350341797, 28.688974380493164, 29.414560317993164, 30.140146255493164, 30.86573028564453, 31.59131622314453, 32.31690216064453, 33.04248809814453]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 16.0, 20.0, 17.0, 28.0, 34.0, 45.0, 58.0, 57.0, 59.0, 65.0, 76.0, 87.0, 76.0, 74.0, 53.0, 49.0, 48.0, 35.0, 33.0, 23.0, 16.0, 11.0, 5.0, 9.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.332628011703491, -3.1939985752105713, -3.0553689002990723, -2.9167394638061523, -2.7781097888946533, -2.6394803524017334, -2.5008506774902344, -2.3622212409973145, -2.2235918045043945, -2.0849623680114746, -1.9463326930999756, -1.8077032566070557, -1.6690735816955566, -1.5304441452026367, -1.3918145895004272, -1.2531850337982178, -1.1145553588867188, -0.9759258031845093, -0.8372962474822998, -0.6986667513847351, -0.5600371956825256, -0.42140763998031616, -0.28277814388275146, -0.144148588180542, -0.0055190324783325195, 0.13311050832271576, 0.27174004912376404, 0.4103695750236511, 0.5489991307258606, 0.6876286864280701, 0.8262581825256348, 0.9648877382278442, 1.1035170555114746, 1.242146611213684, 1.3807761669158936, 1.5194056034088135, 1.6580352783203125, 1.7966647148132324, 1.935294270515442, 2.0739238262176514, 2.2125535011291504, 2.3511829376220703, 2.4898126125335693, 2.6284420490264893, 2.7670717239379883, 2.905701160430908, 3.044330596923828, 3.182960271835327, 3.321589708328247, 3.460219144821167, 3.598848819732666, 3.737478256225586, 3.876107931137085, 4.014737606048584, 4.153367042541504, 4.291996479034424, 4.430625915527344, 4.569255352020264, 4.707884788513184, 4.846514701843262, 4.985144138336182, 5.123773574829102, 5.2624030113220215, 5.401032447814941, 5.5396623611450195]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 9.0, 12.0, 12.0, 13.0, 22.0, 20.0, 20.0, 20.0, 40.0, 30.0, 31.0, 43.0, 66.0, 83.0, 130.0, 291.0, 831.0, 3318.0, 26825.0, 3333543.0, 804908.0, 20220.0, 2728.0, 622.0, 219.0, 102.0, 50.0, 20.0, 13.0, 11.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.46875, -3.38189697265625, -3.2950439453125, -3.20819091796875, -3.121337890625, -3.03448486328125, -2.9476318359375, -2.86077880859375, -2.77392578125, -2.68707275390625, -2.6002197265625, -2.51336669921875, -2.426513671875, -2.33966064453125, -2.2528076171875, -2.16595458984375, -2.0791015625, -1.99224853515625, -1.9053955078125, -1.81854248046875, -1.731689453125, -1.64483642578125, -1.5579833984375, -1.47113037109375, -1.38427734375, -1.29742431640625, -1.2105712890625, -1.12371826171875, -1.036865234375, -0.95001220703125, -0.8631591796875, -0.77630615234375, -0.689453125, -0.60260009765625, -0.5157470703125, -0.42889404296875, -0.342041015625, -0.25518798828125, -0.1683349609375, -0.08148193359375, 0.00537109375, 0.09222412109375, 0.1790771484375, 0.26593017578125, 0.352783203125, 0.43963623046875, 0.5264892578125, 0.61334228515625, 0.7001953125, 0.78704833984375, 0.8739013671875, 0.96075439453125, 1.047607421875, 1.13446044921875, 1.2213134765625, 1.30816650390625, 1.39501953125, 1.48187255859375, 1.5687255859375, 1.65557861328125, 1.742431640625, 1.82928466796875, 1.9161376953125, 2.00299072265625, 2.08984375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 9.0, 18.0, 38.0, 51.0, 77.0, 118.0, 153.0, 136.0, 122.0, 111.0, 77.0, 42.0, 23.0, 16.0, 12.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.33642578125, -0.32973575592041016, -0.3230457305908203, -0.31635570526123047, -0.3096656799316406, -0.3029756546020508, -0.29628562927246094, -0.2895956039428711, -0.28290557861328125, -0.2762155532836914, -0.26952552795410156, -0.2628355026245117, -0.2561454772949219, -0.24945545196533203, -0.2427654266357422, -0.23607540130615234, -0.2293853759765625, -0.22269535064697266, -0.2160053253173828, -0.20931529998779297, -0.20262527465820312, -0.19593524932861328, -0.18924522399902344, -0.1825551986694336, -0.17586517333984375, -0.1691751480102539, -0.16248512268066406, -0.15579509735107422, -0.14910507202148438, -0.14241504669189453, -0.1357250213623047, -0.12903499603271484, -0.122344970703125, -0.11565494537353516, -0.10896492004394531, -0.10227489471435547, -0.09558486938476562, -0.08889484405517578, -0.08220481872558594, -0.0755147933959961, -0.06882476806640625, -0.062134742736816406, -0.05544471740722656, -0.04875469207763672, -0.042064666748046875, -0.03537464141845703, -0.028684616088867188, -0.021994590759277344, -0.0153045654296875, -0.008614540100097656, -0.0019245147705078125, 0.004765510559082031, 0.011455535888671875, 0.01814556121826172, 0.024835586547851562, 0.031525611877441406, 0.03821563720703125, 0.044905662536621094, 0.05159568786621094, 0.05828571319580078, 0.06497573852539062, 0.07166576385498047, 0.07835578918457031, 0.08504581451416016, 0.09173583984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 16.0, 20.0, 17.0, 28.0, 70.0, 100.0, 212.0, 599.0, 2686.0, 4050738.0, 137639.0, 1523.0, 335.0, 124.0, 69.0, 40.0, 28.0, 18.0, 8.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.828125, -13.54522705078125, -13.2623291015625, -12.97943115234375, -12.696533203125, -12.41363525390625, -12.1307373046875, -11.84783935546875, -11.56494140625, -11.28204345703125, -10.9991455078125, -10.71624755859375, -10.433349609375, -10.15045166015625, -9.8675537109375, -9.58465576171875, -9.3017578125, -9.01885986328125, -8.7359619140625, -8.45306396484375, -8.170166015625, -7.88726806640625, -7.6043701171875, -7.32147216796875, -7.03857421875, -6.75567626953125, -6.4727783203125, -6.18988037109375, -5.906982421875, -5.62408447265625, -5.3411865234375, -5.05828857421875, -4.775390625, -4.49249267578125, -4.2095947265625, -3.92669677734375, -3.643798828125, -3.36090087890625, -3.0780029296875, -2.79510498046875, -2.51220703125, -2.22930908203125, -1.9464111328125, -1.66351318359375, -1.380615234375, -1.09771728515625, -0.8148193359375, -0.53192138671875, -0.2490234375, 0.03387451171875, 0.3167724609375, 0.59967041015625, 0.882568359375, 1.16546630859375, 1.4483642578125, 1.73126220703125, 2.01416015625, 2.29705810546875, 2.5799560546875, 2.86285400390625, 3.145751953125, 3.42864990234375, 3.7115478515625, 3.99444580078125, 4.27734375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 10.0, 28.0, 65.0, 268.0, 2330.0, 1071.0, 191.0, 71.0, 24.0, 8.0, 7.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2294921875, -1.2062339782714844, -1.1829757690429688, -1.1597175598144531, -1.1364593505859375, -1.1132011413574219, -1.0899429321289062, -1.0666847229003906, -1.043426513671875, -1.0201683044433594, -0.9969100952148438, -0.9736518859863281, -0.9503936767578125, -0.9271354675292969, -0.9038772583007812, -0.8806190490722656, -0.85736083984375, -0.8341026306152344, -0.8108444213867188, -0.7875862121582031, -0.7643280029296875, -0.7410697937011719, -0.7178115844726562, -0.6945533752441406, -0.671295166015625, -0.6480369567871094, -0.6247787475585938, -0.6015205383300781, -0.5782623291015625, -0.5550041198730469, -0.5317459106445312, -0.5084877014160156, -0.4852294921875, -0.4619712829589844, -0.43871307373046875, -0.4154548645019531, -0.3921966552734375, -0.3689384460449219, -0.34568023681640625, -0.3224220275878906, -0.299163818359375, -0.2759056091308594, -0.25264739990234375, -0.22938919067382812, -0.2061309814453125, -0.18287277221679688, -0.15961456298828125, -0.13635635375976562, -0.11309814453125, -0.08983993530273438, -0.06658172607421875, -0.043323516845703125, -0.0200653076171875, 0.003192901611328125, 0.02645111083984375, 0.049709320068359375, 0.072967529296875, 0.09622573852539062, 0.11948394775390625, 0.14274215698242188, 0.1660003662109375, 0.18925857543945312, 0.21251678466796875, 0.23577499389648438, 0.259033203125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 13.0, 28.0, 74.0, 208.0, 366.0, 196.0, 58.0, 28.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.702433586120605, -8.515105247497559, -8.327775955200195, -8.140447616577148, -7.953118324279785, -7.765789985656738, -7.578461170196533, -7.391132354736328, -7.203803539276123, -7.016474723815918, -6.829145908355713, -6.641817092895508, -6.454488754272461, -6.267159938812256, -6.079831123352051, -5.892502307891846, -5.705173492431641, -5.5178446769714355, -5.3305158615112305, -5.143187046051025, -4.95585823059082, -4.768529891967773, -4.581201076507568, -4.393872261047363, -4.206543445587158, -4.019214630126953, -3.831885814666748, -3.644557237625122, -3.457228422164917, -3.269899606704712, -3.082571029663086, -2.895242214202881, -2.707913637161255, -2.52058482170105, -2.333256244659424, -2.1459274291992188, -1.9585986137390137, -1.7712697982788086, -1.583941102027893, -1.3966124057769775, -1.2092835903167725, -1.0219547748565674, -0.8346260786056519, -0.6472973227500916, -0.45996856689453125, -0.27263981103897095, -0.08531105518341064, 0.10201764106750488, 0.28934645652770996, 0.47667521238327026, 0.6640039682388306, 0.8513327240943909, 1.0386614799499512, 1.2259902954101562, 1.4133189916610718, 1.6006476879119873, 1.7879765033721924, 1.9753053188323975, 2.1626338958740234, 2.3499627113342285, 2.5372915267944336, 2.7246203422546387, 2.9119491577148438, 3.0992777347564697, 3.286606550216675]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 11.0, 26.0, 33.0, 47.0, 54.0, 87.0, 95.0, 101.0, 102.0, 98.0, 96.0, 73.0, 60.0, 39.0, 32.0, 11.0, 8.0, 11.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0964064598083496, -3.000277519226074, -2.9041483402252197, -2.8080193996429443, -2.71189022064209, -2.6157612800598145, -2.519632339477539, -2.4235033988952637, -2.327374219894409, -2.231245279312134, -2.1351161003112793, -2.038987159729004, -1.942858099937439, -1.846729040145874, -1.7506000995635986, -1.6544710397720337, -1.5583419799804688, -1.4622129201889038, -1.3660838603973389, -1.2699549198150635, -1.1738258600234985, -1.0776968002319336, -0.9815678000450134, -0.8854387998580933, -0.7893097400665283, -0.6931806802749634, -0.5970516800880432, -0.500922679901123, -0.4047936201095581, -0.30866459012031555, -0.212535560131073, -0.11640655994415283, -0.020277738571166992, 0.07585129141807556, 0.17198032140731812, 0.26810935139656067, 0.3642383813858032, 0.4603674113750458, 0.5564964413642883, 0.6526254415512085, 0.7487545013427734, 0.8448835611343384, 0.9410125613212585, 1.0371415615081787, 1.1332706212997437, 1.2293996810913086, 1.325528621673584, 1.421657681465149, 1.5177867412567139, 1.6139158010482788, 1.7100448608398438, 1.8061738014221191, 1.902302861213684, 1.998431921005249, 2.0945608615875244, 2.190690040588379, 2.2868189811706543, 2.3829479217529297, 2.479077100753784, 2.5752060413360596, 2.671335220336914, 2.7674641609191895, 2.863593101501465, 2.9597220420837402, 3.0558512210845947]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 11.0, 6.0, 7.0, 14.0, 28.0, 33.0, 38.0, 76.0, 106.0, 187.0, 356.0, 872.0, 2785.0, 15452.0, 193535.0, 761857.0, 62793.0, 7264.0, 1764.0, 621.0, 282.0, 158.0, 99.0, 65.0, 44.0, 24.0, 18.0, 14.0, 11.0, 11.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.54296875, -2.468841552734375, -2.39471435546875, -2.320587158203125, -2.2464599609375, -2.172332763671875, -2.09820556640625, -2.024078369140625, -1.949951171875, -1.875823974609375, -1.80169677734375, -1.727569580078125, -1.6534423828125, -1.579315185546875, -1.50518798828125, -1.431060791015625, -1.35693359375, -1.282806396484375, -1.20867919921875, -1.134552001953125, -1.0604248046875, -0.986297607421875, -0.91217041015625, -0.838043212890625, -0.763916015625, -0.689788818359375, -0.61566162109375, -0.541534423828125, -0.4674072265625, -0.393280029296875, -0.31915283203125, -0.245025634765625, -0.1708984375, -0.096771240234375, -0.02264404296875, 0.051483154296875, 0.1256103515625, 0.199737548828125, 0.27386474609375, 0.347991943359375, 0.422119140625, 0.496246337890625, 0.57037353515625, 0.644500732421875, 0.7186279296875, 0.792755126953125, 0.86688232421875, 0.941009521484375, 1.01513671875, 1.089263916015625, 1.16339111328125, 1.237518310546875, 1.3116455078125, 1.385772705078125, 1.45989990234375, 1.534027099609375, 1.608154296875, 1.682281494140625, 1.75640869140625, 1.830535888671875, 1.9046630859375, 1.978790283203125, 2.05291748046875, 2.127044677734375, 2.201171875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 10.0, 16.0, 30.0, 46.0, 73.0, 87.0, 96.0, 136.0, 130.0, 105.0, 83.0, 71.0, 43.0, 28.0, 21.0, 10.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.38037109375, -0.3719196319580078, -0.3634681701660156, -0.35501670837402344, -0.34656524658203125, -0.33811378479003906, -0.3296623229980469, -0.3212108612060547, -0.3127593994140625, -0.3043079376220703, -0.2958564758300781, -0.28740501403808594, -0.27895355224609375, -0.27050209045410156, -0.2620506286621094, -0.2535991668701172, -0.245147705078125, -0.2366962432861328, -0.22824478149414062, -0.21979331970214844, -0.21134185791015625, -0.20289039611816406, -0.19443893432617188, -0.1859874725341797, -0.1775360107421875, -0.1690845489501953, -0.16063308715820312, -0.15218162536621094, -0.14373016357421875, -0.13527870178222656, -0.12682723999023438, -0.11837577819824219, -0.10992431640625, -0.10147285461425781, -0.09302139282226562, -0.08456993103027344, -0.07611846923828125, -0.06766700744628906, -0.059215545654296875, -0.05076408386230469, -0.0423126220703125, -0.03386116027832031, -0.025409698486328125, -0.016958236694335938, -0.00850677490234375, -5.53131103515625e-05, 0.008396148681640625, 0.016847610473632812, 0.025299072265625, 0.03375053405761719, 0.042201995849609375, 0.05065345764160156, 0.05910491943359375, 0.06755638122558594, 0.07600784301757812, 0.08445930480957031, 0.0929107666015625, 0.10136222839355469, 0.10981369018554688, 0.11826515197753906, 0.12671661376953125, 0.13516807556152344, 0.14361953735351562, 0.1520709991455078, 0.1605224609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 6.0, 6.0, 10.0, 17.0, 19.0, 23.0, 47.0, 61.0, 103.0, 194.0, 325.0, 692.0, 1595.0, 3844.0, 11491.0, 50529.0, 337455.0, 523778.0, 91606.0, 17647.0, 5247.0, 1954.0, 845.0, 403.0, 225.0, 143.0, 84.0, 57.0, 26.0, 34.0, 19.0, 14.0, 12.0, 4.0, 10.0, 4.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1435546875, -1.10906982421875, -1.0745849609375, -1.04010009765625, -1.005615234375, -0.97113037109375, -0.9366455078125, -0.90216064453125, -0.86767578125, -0.83319091796875, -0.7987060546875, -0.76422119140625, -0.729736328125, -0.69525146484375, -0.6607666015625, -0.62628173828125, -0.591796875, -0.55731201171875, -0.5228271484375, -0.48834228515625, -0.453857421875, -0.41937255859375, -0.3848876953125, -0.35040283203125, -0.31591796875, -0.28143310546875, -0.2469482421875, -0.21246337890625, -0.177978515625, -0.14349365234375, -0.1090087890625, -0.07452392578125, -0.0400390625, -0.00555419921875, 0.0289306640625, 0.06341552734375, 0.097900390625, 0.13238525390625, 0.1668701171875, 0.20135498046875, 0.23583984375, 0.27032470703125, 0.3048095703125, 0.33929443359375, 0.373779296875, 0.40826416015625, 0.4427490234375, 0.47723388671875, 0.51171875, 0.54620361328125, 0.5806884765625, 0.61517333984375, 0.649658203125, 0.68414306640625, 0.7186279296875, 0.75311279296875, 0.78759765625, 0.82208251953125, 0.8565673828125, 0.89105224609375, 0.925537109375, 0.96002197265625, 0.9945068359375, 1.02899169921875, 1.0634765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 3.0, 9.0, 13.0, 12.0, 15.0, 16.0, 14.0, 19.0, 30.0, 43.0, 37.0, 34.0, 49.0, 46.0, 54.0, 40.0, 48.0, 69.0, 48.0, 52.0, 43.0, 38.0, 36.0, 40.0, 34.0, 28.0, 19.0, 22.0, 14.0, 16.0, 10.0, 15.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.60498046875, -0.5870590209960938, -0.5691375732421875, -0.5512161254882812, -0.533294677734375, -0.5153732299804688, -0.4974517822265625, -0.47953033447265625, -0.46160888671875, -0.44368743896484375, -0.4257659912109375, -0.40784454345703125, -0.389923095703125, -0.37200164794921875, -0.3540802001953125, -0.33615875244140625, -0.3182373046875, -0.30031585693359375, -0.2823944091796875, -0.26447296142578125, -0.246551513671875, -0.22863006591796875, -0.2107086181640625, -0.19278717041015625, -0.17486572265625, -0.15694427490234375, -0.1390228271484375, -0.12110137939453125, -0.103179931640625, -0.08525848388671875, -0.0673370361328125, -0.04941558837890625, -0.031494140625, -0.01357269287109375, 0.0043487548828125, 0.02227020263671875, 0.040191650390625, 0.05811309814453125, 0.0760345458984375, 0.09395599365234375, 0.11187744140625, 0.12979888916015625, 0.1477203369140625, 0.16564178466796875, 0.183563232421875, 0.20148468017578125, 0.2194061279296875, 0.23732757568359375, 0.2552490234375, 0.27317047119140625, 0.2910919189453125, 0.30901336669921875, 0.326934814453125, 0.34485626220703125, 0.3627777099609375, 0.38069915771484375, 0.39862060546875, 0.41654205322265625, 0.4344635009765625, 0.45238494873046875, 0.470306396484375, 0.48822784423828125, 0.5061492919921875, 0.5240707397460938, 0.5419921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 10.0, 7.0, 15.0, 14.0, 19.0, 40.0, 50.0, 111.0, 193.0, 404.0, 772.0, 1910.0, 5636.0, 25856.0, 371294.0, 590955.0, 39818.0, 7196.0, 2318.0, 966.0, 447.0, 189.0, 119.0, 71.0, 50.0, 29.0, 16.0, 21.0, 9.0, 5.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8662109375, -0.8400421142578125, -0.813873291015625, -0.7877044677734375, -0.76153564453125, -0.7353668212890625, -0.709197998046875, -0.6830291748046875, -0.6568603515625, -0.6306915283203125, -0.604522705078125, -0.5783538818359375, -0.55218505859375, -0.5260162353515625, -0.499847412109375, -0.4736785888671875, -0.447509765625, -0.4213409423828125, -0.395172119140625, -0.3690032958984375, -0.34283447265625, -0.3166656494140625, -0.290496826171875, -0.2643280029296875, -0.2381591796875, -0.2119903564453125, -0.185821533203125, -0.1596527099609375, -0.13348388671875, -0.1073150634765625, -0.081146240234375, -0.0549774169921875, -0.02880859375, -0.0026397705078125, 0.023529052734375, 0.0496978759765625, 0.07586669921875, 0.1020355224609375, 0.128204345703125, 0.1543731689453125, 0.1805419921875, 0.2067108154296875, 0.232879638671875, 0.2590484619140625, 0.28521728515625, 0.3113861083984375, 0.337554931640625, 0.3637237548828125, 0.389892578125, 0.4160614013671875, 0.442230224609375, 0.4683990478515625, 0.49456787109375, 0.5207366943359375, 0.546905517578125, 0.5730743408203125, 0.5992431640625, 0.6254119873046875, 0.651580810546875, 0.6777496337890625, 0.70391845703125, 0.7300872802734375, 0.756256103515625, 0.7824249267578125, 0.80859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 13.0, 19.0, 24.0, 28.0, 57.0, 73.0, 97.0, 120.0, 130.0, 124.0, 82.0, 57.0, 50.0, 30.0, 19.0, 14.0, 10.0, 9.0, 9.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00012421607971191406, -0.00012098532170057297, -0.00011775456368923187, -0.00011452380567789078, -0.00011129304766654968, -0.00010806228965520859, -0.00010483153164386749, -0.0001016007736325264, -9.83700156211853e-05, -9.513925760984421e-05, -9.190849959850311e-05, -8.867774158716202e-05, -8.544698357582092e-05, -8.221622556447983e-05, -7.898546755313873e-05, -7.575470954179764e-05, -7.252395153045654e-05, -6.929319351911545e-05, -6.606243550777435e-05, -6.283167749643326e-05, -5.960091948509216e-05, -5.637016147375107e-05, -5.313940346240997e-05, -4.990864545106888e-05, -4.667788743972778e-05, -4.344712942838669e-05, -4.021637141704559e-05, -3.69856134057045e-05, -3.37548553943634e-05, -3.052409738302231e-05, -2.7293339371681213e-05, -2.406258136034012e-05, -2.0831823348999023e-05, -1.760106533765793e-05, -1.4370307326316833e-05, -1.1139549314975739e-05, -7.908791303634644e-06, -4.678033292293549e-06, -1.4472752809524536e-06, 1.7834827303886414e-06, 5.014240741729736e-06, 8.244998753070831e-06, 1.1475756764411926e-05, 1.4706514775753021e-05, 1.7937272787094116e-05, 2.116803079843521e-05, 2.4398788809776306e-05, 2.76295468211174e-05, 3.0860304832458496e-05, 3.409106284379959e-05, 3.7321820855140686e-05, 4.055257886648178e-05, 4.3783336877822876e-05, 4.701409488916397e-05, 5.0244852900505066e-05, 5.347561091184616e-05, 5.6706368923187256e-05, 5.993712693452835e-05, 6.316788494586945e-05, 6.639864295721054e-05, 6.962940096855164e-05, 7.286015897989273e-05, 7.609091699123383e-05, 7.932167500257492e-05, 8.255243301391602e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 10.0, 7.0, 22.0, 23.0, 59.0, 72.0, 126.0, 258.0, 509.0, 1002.0, 2267.0, 5979.0, 20589.0, 217102.0, 721806.0, 60927.0, 10816.0, 3737.0, 1551.0, 781.0, 384.0, 177.0, 108.0, 72.0, 43.0, 33.0, 20.0, 13.0, 8.0, 7.0, 4.0, 5.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.896484375, -0.8710708618164062, -0.8456573486328125, -0.8202438354492188, -0.794830322265625, -0.7694168090820312, -0.7440032958984375, -0.7185897827148438, -0.69317626953125, -0.6677627563476562, -0.6423492431640625, -0.6169357299804688, -0.591522216796875, -0.5661087036132812, -0.5406951904296875, -0.5152816772460938, -0.4898681640625, -0.46445465087890625, -0.4390411376953125, -0.41362762451171875, -0.388214111328125, -0.36280059814453125, -0.3373870849609375, -0.31197357177734375, -0.28656005859375, -0.26114654541015625, -0.2357330322265625, -0.21031951904296875, -0.184906005859375, -0.15949249267578125, -0.1340789794921875, -0.10866546630859375, -0.083251953125, -0.05783843994140625, -0.0324249267578125, -0.00701141357421875, 0.018402099609375, 0.04381561279296875, 0.0692291259765625, 0.09464263916015625, 0.12005615234375, 0.14546966552734375, 0.1708831787109375, 0.19629669189453125, 0.221710205078125, 0.24712371826171875, 0.2725372314453125, 0.29795074462890625, 0.3233642578125, 0.34877777099609375, 0.3741912841796875, 0.39960479736328125, 0.425018310546875, 0.45043182373046875, 0.4758453369140625, 0.5012588500976562, 0.52667236328125, 0.5520858764648438, 0.5774993896484375, 0.6029129028320312, 0.628326416015625, 0.6537399291992188, 0.6791534423828125, 0.7045669555664062, 0.72998046875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 12.0, 7.0, 12.0, 12.0, 36.0, 66.0, 73.0, 125.0, 142.0, 158.0, 124.0, 87.0, 54.0, 37.0, 17.0, 11.0, 11.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.6201171875, -0.6034126281738281, -0.5867080688476562, -0.5700035095214844, -0.5532989501953125, -0.5365943908691406, -0.5198898315429688, -0.5031852722167969, -0.486480712890625, -0.4697761535644531, -0.45307159423828125, -0.4363670349121094, -0.4196624755859375, -0.4029579162597656, -0.38625335693359375, -0.3695487976074219, -0.35284423828125, -0.3361396789550781, -0.31943511962890625, -0.3027305603027344, -0.2860260009765625, -0.2693214416503906, -0.25261688232421875, -0.23591232299804688, -0.219207763671875, -0.20250320434570312, -0.18579864501953125, -0.16909408569335938, -0.1523895263671875, -0.13568496704101562, -0.11898040771484375, -0.10227584838867188, -0.0855712890625, -0.06886672973632812, -0.05216217041015625, -0.035457611083984375, -0.0187530517578125, -0.002048492431640625, 0.01465606689453125, 0.031360626220703125, 0.048065185546875, 0.06476974487304688, 0.08147430419921875, 0.09817886352539062, 0.1148834228515625, 0.13158798217773438, 0.14829254150390625, 0.16499710083007812, 0.18170166015625, 0.19840621948242188, 0.21511077880859375, 0.23181533813476562, 0.2485198974609375, 0.2652244567871094, 0.28192901611328125, 0.2986335754394531, 0.315338134765625, 0.3320426940917969, 0.34874725341796875, 0.3654518127441406, 0.3821563720703125, 0.3988609313964844, 0.41556549072265625, 0.4322700500488281, 0.448974609375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 73.0, 343.0, 463.0, 103.0, 17.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.177642822265625, -25.555749893188477, -24.93385887145996, -24.311965942382812, -23.690074920654297, -23.06818199157715, -22.4462890625, -21.824398040771484, -21.202505111694336, -20.580612182617188, -19.958721160888672, -19.336828231811523, -18.714935302734375, -18.09304428100586, -17.47115135192871, -16.849258422851562, -16.227367401123047, -15.605475425720215, -14.983583450317383, -14.361690521240234, -13.739798545837402, -13.11790657043457, -12.496013641357422, -11.87412166595459, -11.252229690551758, -10.630337715148926, -10.008445739746094, -9.386552810668945, -8.764660835266113, -8.142768859863281, -7.520876407623291, -6.898983955383301, -6.277091026306152, -5.65519905090332, -5.03330659866333, -4.41141414642334, -3.789522171020508, -3.1676299571990967, -2.5457377433776855, -1.9238452911376953, -1.3019533157348633, -0.6800611019134521, -0.058168888092041016, 0.5637233257293701, 1.1856155395507812, 1.8075077533721924, 2.4293999671936035, 3.0512924194335938, 3.673184394836426, 4.295076370239258, 4.916968822479248, 5.538861274719238, 6.16075325012207, 6.782645225524902, 7.404537677764893, 8.026430130004883, 8.648322105407715, 9.270214080810547, 9.892107009887695, 10.513998985290527, 11.13589096069336, 11.757782936096191, 12.379674911499023, 13.001567840576172, 13.623459815979004]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 9.0, 10.0, 14.0, 15.0, 26.0, 13.0, 28.0, 23.0, 30.0, 34.0, 36.0, 50.0, 50.0, 57.0, 55.0, 38.0, 50.0, 61.0, 41.0, 46.0, 43.0, 29.0, 37.0, 27.0, 22.0, 28.0, 21.0, 15.0, 14.0, 21.0, 11.0, 11.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1218209266662598, -3.0180411338806152, -2.91426157951355, -2.8104817867279053, -2.70670223236084, -2.6029224395751953, -2.49914288520813, -2.3953630924224854, -2.29158353805542, -2.1878037452697754, -2.08402419090271, -1.980244517326355, -1.87646484375, -1.7726850509643555, -1.66890549659729, -1.5651257038116455, -1.4613460302352905, -1.3575663566589355, -1.2537866830825806, -1.1500070095062256, -1.0462273359298706, -0.9424476027488708, -0.8386679291725159, -0.7348882555961609, -0.6311085820198059, -0.5273289084434509, -0.42354923486709595, -0.3197695314884186, -0.2159898579120636, -0.11221015453338623, -0.00843048095703125, 0.09534919261932373, 0.1991288661956787, 0.3029085397720337, 0.40668821334838867, 0.5104678869247437, 0.6142475605010986, 0.7180272936820984, 0.8218069672584534, 0.9255866408348083, 1.0293662548065186, 1.1331459283828735, 1.2369256019592285, 1.3407052755355835, 1.4444849491119385, 1.548264741897583, 1.6520442962646484, 1.755824089050293, 1.859603762626648, 1.963383436203003, 2.0671632289886475, 2.170942783355713, 2.2747225761413574, 2.378502130508423, 2.4822819232940674, 2.586061477661133, 2.6898412704467773, 2.793621063232422, 2.8974006175994873, 3.001180410385132, 3.1049599647521973, 3.208739757537842, 3.3125193119049072, 3.4162991046905518, 3.520078659057617]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 4.0, 7.0, 13.0, 8.0, 12.0, 17.0, 16.0, 23.0, 31.0, 33.0, 48.0, 71.0, 85.0, 126.0, 191.0, 301.0, 586.0, 1353.0, 4204.0, 18399.0, 178563.0, 3909916.0, 64907.0, 10893.0, 2754.0, 924.0, 415.0, 171.0, 109.0, 38.0, 21.0, 16.0, 7.0, 4.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.974609375, -2.89697265625, -2.8193359375, -2.74169921875, -2.6640625, -2.58642578125, -2.5087890625, -2.43115234375, -2.353515625, -2.27587890625, -2.1982421875, -2.12060546875, -2.04296875, -1.96533203125, -1.8876953125, -1.81005859375, -1.732421875, -1.65478515625, -1.5771484375, -1.49951171875, -1.421875, -1.34423828125, -1.2666015625, -1.18896484375, -1.111328125, -1.03369140625, -0.9560546875, -0.87841796875, -0.80078125, -0.72314453125, -0.6455078125, -0.56787109375, -0.490234375, -0.41259765625, -0.3349609375, -0.25732421875, -0.1796875, -0.10205078125, -0.0244140625, 0.05322265625, 0.130859375, 0.20849609375, 0.2861328125, 0.36376953125, 0.44140625, 0.51904296875, 0.5966796875, 0.67431640625, 0.751953125, 0.82958984375, 0.9072265625, 0.98486328125, 1.0625, 1.14013671875, 1.2177734375, 1.29541015625, 1.373046875, 1.45068359375, 1.5283203125, 1.60595703125, 1.68359375, 1.76123046875, 1.8388671875, 1.91650390625, 1.994140625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 9.0, 13.0, 20.0, 36.0, 46.0, 73.0, 102.0, 94.0, 135.0, 120.0, 102.0, 87.0, 65.0, 36.0, 30.0, 13.0, 10.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.402099609375, -0.3930950164794922, -0.3840904235839844, -0.37508583068847656, -0.36608123779296875, -0.35707664489746094, -0.3480720520019531, -0.3390674591064453, -0.3300628662109375, -0.3210582733154297, -0.3120536804199219, -0.30304908752441406, -0.29404449462890625, -0.28503990173339844, -0.2760353088378906, -0.2670307159423828, -0.258026123046875, -0.2490215301513672, -0.24001693725585938, -0.23101234436035156, -0.22200775146484375, -0.21300315856933594, -0.20399856567382812, -0.1949939727783203, -0.1859893798828125, -0.1769847869873047, -0.16798019409179688, -0.15897560119628906, -0.14997100830078125, -0.14096641540527344, -0.13196182250976562, -0.12295722961425781, -0.11395263671875, -0.10494804382324219, -0.09594345092773438, -0.08693885803222656, -0.07793426513671875, -0.06892967224121094, -0.059925079345703125, -0.05092048645019531, -0.0419158935546875, -0.03291130065917969, -0.023906707763671875, -0.014902114868164062, -0.00589752197265625, 0.0031070709228515625, 0.012111663818359375, 0.021116256713867188, 0.030120849609375, 0.03912544250488281, 0.048130035400390625, 0.05713462829589844, 0.06613922119140625, 0.07514381408691406, 0.08414840698242188, 0.09315299987792969, 0.1021575927734375, 0.11116218566894531, 0.12016677856445312, 0.12917137145996094, 0.13817596435546875, 0.14718055725097656, 0.15618515014648438, 0.1651897430419922, 0.1741943359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 21.0, 12.0, 23.0, 40.0, 52.0, 68.0, 124.0, 184.0, 401.0, 2177.0, 125713.0, 4058237.0, 6094.0, 636.0, 203.0, 106.0, 62.0, 38.0, 34.0, 21.0, 13.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.754241943359375, -7.57879638671875, -7.403350830078125, -7.2279052734375, -7.052459716796875, -6.87701416015625, -6.701568603515625, -6.526123046875, -6.350677490234375, -6.17523193359375, -5.999786376953125, -5.8243408203125, -5.648895263671875, -5.47344970703125, -5.298004150390625, -5.12255859375, -4.947113037109375, -4.77166748046875, -4.596221923828125, -4.4207763671875, -4.245330810546875, -4.06988525390625, -3.894439697265625, -3.718994140625, -3.543548583984375, -3.36810302734375, -3.192657470703125, -3.0172119140625, -2.841766357421875, -2.66632080078125, -2.490875244140625, -2.3154296875, -2.139984130859375, -1.96453857421875, -1.789093017578125, -1.6136474609375, -1.438201904296875, -1.26275634765625, -1.087310791015625, -0.911865234375, -0.736419677734375, -0.56097412109375, -0.385528564453125, -0.2100830078125, -0.034637451171875, 0.14080810546875, 0.316253662109375, 0.49169921875, 0.667144775390625, 0.84259033203125, 1.018035888671875, 1.1934814453125, 1.368927001953125, 1.54437255859375, 1.719818115234375, 1.895263671875, 2.070709228515625, 2.24615478515625, 2.421600341796875, 2.5970458984375, 2.772491455078125, 2.94793701171875, 3.123382568359375, 3.298828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 17.0, 52.0, 176.0, 2418.0, 1230.0, 141.0, 29.0, 10.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.7275390625, -1.6942520141601562, -1.6609649658203125, -1.6276779174804688, -1.594390869140625, -1.5611038208007812, -1.5278167724609375, -1.4945297241210938, -1.46124267578125, -1.4279556274414062, -1.3946685791015625, -1.3613815307617188, -1.328094482421875, -1.2948074340820312, -1.2615203857421875, -1.2282333374023438, -1.1949462890625, -1.1616592407226562, -1.1283721923828125, -1.0950851440429688, -1.061798095703125, -1.0285110473632812, -0.9952239990234375, -0.9619369506835938, -0.92864990234375, -0.8953628540039062, -0.8620758056640625, -0.8287887573242188, -0.795501708984375, -0.7622146606445312, -0.7289276123046875, -0.6956405639648438, -0.662353515625, -0.6290664672851562, -0.5957794189453125, -0.5624923706054688, -0.529205322265625, -0.49591827392578125, -0.4626312255859375, -0.42934417724609375, -0.39605712890625, -0.36277008056640625, -0.3294830322265625, -0.29619598388671875, -0.262908935546875, -0.22962188720703125, -0.1963348388671875, -0.16304779052734375, -0.1297607421875, -0.09647369384765625, -0.0631866455078125, -0.02989959716796875, 0.003387451171875, 0.03667449951171875, 0.0699615478515625, 0.10324859619140625, 0.13653564453125, 0.16982269287109375, 0.2031097412109375, 0.23639678955078125, 0.269683837890625, 0.30297088623046875, 0.3362579345703125, 0.36954498291015625, 0.40283203125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 14.0, 22.0, 65.0, 185.0, 290.0, 253.0, 104.0, 37.0, 11.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.470098972320557, -5.325133323669434, -5.180168151855469, -5.035202503204346, -4.890236854553223, -4.745271682739258, -4.600306034088135, -4.455340385437012, -4.310375213623047, -4.165409564971924, -4.020444393157959, -3.875478744506836, -3.730513095855713, -3.585547685623169, -3.440582275390625, -3.295616626739502, -3.150650978088379, -3.005685567855835, -2.860719919204712, -2.715754508972168, -2.570788860321045, -2.425823450088501, -2.280858039855957, -2.135892391204834, -1.99092698097229, -1.8459614515304565, -1.700995922088623, -1.556030511856079, -1.4110649824142456, -1.266099452972412, -1.1211340427398682, -0.9761685132980347, -0.8312032222747803, -0.6862376928329468, -0.5412722229957581, -0.39630672335624695, -0.25134122371673584, -0.10637569427490234, 0.03858977556228638, 0.1835552453994751, 0.3285207748413086, 0.4734862744808197, 0.6184517741203308, 0.7634172439575195, 0.908382773399353, 1.0533483028411865, 1.1983137130737305, 1.343279242515564, 1.4882447719573975, 1.633210301399231, 1.7781758308410645, 1.9231412410736084, 2.0681066513061523, 2.2130722999572754, 2.3580377101898193, 2.5030031204223633, 2.6479687690734863, 2.7929341793060303, 2.9378998279571533, 3.0828652381896973, 3.2278308868408203, 3.3727962970733643, 3.517761707305908, 3.6627273559570312, 3.807692766189575]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 5.0, 7.0, 16.0, 22.0, 32.0, 35.0, 50.0, 53.0, 84.0, 66.0, 90.0, 80.0, 88.0, 64.0, 64.0, 59.0, 40.0, 45.0, 31.0, 26.0, 11.0, 10.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3638198375701904, -2.2956786155700684, -2.2275376319885254, -2.1593964099884033, -2.0912551879882812, -2.0231142044067383, -1.9549729824066162, -1.8868317604064941, -1.8186906576156616, -1.750549554824829, -1.682408332824707, -1.6142672300338745, -1.546126127243042, -1.47798490524292, -1.4098438024520874, -1.3417026996612549, -1.2735614776611328, -1.2054203748703003, -1.1372791528701782, -1.0691380500793457, -1.0009968280792236, -0.9328557252883911, -0.8647146224975586, -0.7965734601020813, -0.728432297706604, -0.6602911353111267, -0.5921499729156494, -0.5240088701248169, -0.4558677077293396, -0.3877265453338623, -0.3195854127407074, -0.2514442801475525, -0.1833028793334961, -0.11516173183917999, -0.04702058434486389, 0.02112056314945221, 0.08926171064376831, 0.1574028730392456, 0.2255440056324005, 0.2936851382255554, 0.3618263006210327, 0.42996746301651, 0.4981085956096649, 0.5662497282028198, 0.6343908905982971, 0.7025320529937744, 0.7706731557846069, 0.8388143181800842, 0.9069554805755615, 0.9750966429710388, 1.0432378053665161, 1.1113789081573486, 1.1795201301574707, 1.2476612329483032, 1.3158023357391357, 1.3839435577392578, 1.4520846605300903, 1.5202257633209229, 1.588366985321045, 1.6565080881118774, 1.72464919090271, 1.792790412902832, 1.8609315156936646, 1.929072618484497, 1.9972138404846191]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 20.0, 34.0, 49.0, 73.0, 159.0, 310.0, 736.0, 2375.0, 16470.0, 560255.0, 450631.0, 13928.0, 2172.0, 717.0, 286.0, 146.0, 77.0, 37.0, 24.0, 17.0, 4.0, 3.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.6666259765625, -2.559814453125, -2.4530029296875, -2.34619140625, -2.2393798828125, -2.132568359375, -2.0257568359375, -1.9189453125, -1.8121337890625, -1.705322265625, -1.5985107421875, -1.49169921875, -1.3848876953125, -1.278076171875, -1.1712646484375, -1.064453125, -0.9576416015625, -0.850830078125, -0.7440185546875, -0.63720703125, -0.5303955078125, -0.423583984375, -0.3167724609375, -0.2099609375, -0.1031494140625, 0.003662109375, 0.1104736328125, 0.21728515625, 0.3240966796875, 0.430908203125, 0.5377197265625, 0.64453125, 0.7513427734375, 0.858154296875, 0.9649658203125, 1.07177734375, 1.1785888671875, 1.285400390625, 1.3922119140625, 1.4990234375, 1.6058349609375, 1.712646484375, 1.8194580078125, 1.92626953125, 2.0330810546875, 2.139892578125, 2.2467041015625, 2.353515625, 2.4603271484375, 2.567138671875, 2.6739501953125, 2.78076171875, 2.8875732421875, 2.994384765625, 3.1011962890625, 3.2080078125, 3.3148193359375, 3.421630859375, 3.5284423828125, 3.63525390625, 3.7420654296875, 3.848876953125, 3.9556884765625, 4.0625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 13.0, 13.0, 23.0, 51.0, 51.0, 73.0, 73.0, 95.0, 110.0, 107.0, 102.0, 78.0, 61.0, 40.0, 38.0, 25.0, 18.0, 7.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.40673828125, -0.3970069885253906, -0.38727569580078125, -0.3775444030761719, -0.3678131103515625, -0.3580818176269531, -0.34835052490234375, -0.3386192321777344, -0.328887939453125, -0.3191566467285156, -0.30942535400390625, -0.2996940612792969, -0.2899627685546875, -0.2802314758300781, -0.27050018310546875, -0.2607688903808594, -0.25103759765625, -0.24130630493164062, -0.23157501220703125, -0.22184371948242188, -0.2121124267578125, -0.20238113403320312, -0.19264984130859375, -0.18291854858398438, -0.173187255859375, -0.16345596313476562, -0.15372467041015625, -0.14399337768554688, -0.1342620849609375, -0.12453079223632812, -0.11479949951171875, -0.10506820678710938, -0.0953369140625, -0.08560562133789062, -0.07587432861328125, -0.06614303588867188, -0.0564117431640625, -0.046680450439453125, -0.03694915771484375, -0.027217864990234375, -0.017486572265625, -0.007755279541015625, 0.00197601318359375, 0.011707305908203125, 0.0214385986328125, 0.031169891357421875, 0.04090118408203125, 0.050632476806640625, 0.06036376953125, 0.07009506225585938, 0.07982635498046875, 0.08955764770507812, 0.0992889404296875, 0.10902023315429688, 0.11875152587890625, 0.12848281860351562, 0.138214111328125, 0.14794540405273438, 0.15767669677734375, 0.16740798950195312, 0.1771392822265625, 0.18687057495117188, 0.19660186767578125, 0.20633316040039062, 0.216064453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 5.0, 17.0, 14.0, 30.0, 58.0, 85.0, 174.0, 339.0, 879.0, 2375.0, 8723.0, 63852.0, 743702.0, 205061.0, 17218.0, 3721.0, 1271.0, 521.0, 229.0, 106.0, 68.0, 29.0, 22.0, 9.0, 10.0, 9.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.220703125, -2.156707763671875, -2.09271240234375, -2.028717041015625, -1.9647216796875, -1.900726318359375, -1.83673095703125, -1.772735595703125, -1.708740234375, -1.644744873046875, -1.58074951171875, -1.516754150390625, -1.4527587890625, -1.388763427734375, -1.32476806640625, -1.260772705078125, -1.19677734375, -1.132781982421875, -1.06878662109375, -1.004791259765625, -0.9407958984375, -0.876800537109375, -0.81280517578125, -0.748809814453125, -0.684814453125, -0.620819091796875, -0.55682373046875, -0.492828369140625, -0.4288330078125, -0.364837646484375, -0.30084228515625, -0.236846923828125, -0.1728515625, -0.108856201171875, -0.04486083984375, 0.019134521484375, 0.0831298828125, 0.147125244140625, 0.21112060546875, 0.275115966796875, 0.339111328125, 0.403106689453125, 0.46710205078125, 0.531097412109375, 0.5950927734375, 0.659088134765625, 0.72308349609375, 0.787078857421875, 0.85107421875, 0.915069580078125, 0.97906494140625, 1.043060302734375, 1.1070556640625, 1.171051025390625, 1.23504638671875, 1.299041748046875, 1.363037109375, 1.427032470703125, 1.49102783203125, 1.555023193359375, 1.6190185546875, 1.683013916015625, 1.74700927734375, 1.811004638671875, 1.875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 7.0, 7.0, 8.0, 9.0, 22.0, 28.0, 31.0, 37.0, 41.0, 53.0, 68.0, 71.0, 59.0, 72.0, 83.0, 80.0, 69.0, 47.0, 50.0, 37.0, 30.0, 20.0, 22.0, 19.0, 11.0, 4.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.240234375, -1.2054824829101562, -1.1707305908203125, -1.1359786987304688, -1.101226806640625, -1.0664749145507812, -1.0317230224609375, -0.9969711303710938, -0.96221923828125, -0.9274673461914062, -0.8927154541015625, -0.8579635620117188, -0.823211669921875, -0.7884597778320312, -0.7537078857421875, -0.7189559936523438, -0.6842041015625, -0.6494522094726562, -0.6147003173828125, -0.5799484252929688, -0.545196533203125, -0.5104446411132812, -0.4756927490234375, -0.44094085693359375, -0.40618896484375, -0.37143707275390625, -0.3366851806640625, -0.30193328857421875, -0.267181396484375, -0.23242950439453125, -0.1976776123046875, -0.16292572021484375, -0.128173828125, -0.09342193603515625, -0.0586700439453125, -0.02391815185546875, 0.010833740234375, 0.04558563232421875, 0.0803375244140625, 0.11508941650390625, 0.14984130859375, 0.18459320068359375, 0.2193450927734375, 0.25409698486328125, 0.288848876953125, 0.32360076904296875, 0.3583526611328125, 0.39310455322265625, 0.4278564453125, 0.46260833740234375, 0.4973602294921875, 0.5321121215820312, 0.566864013671875, 0.6016159057617188, 0.6363677978515625, 0.6711196899414062, 0.70587158203125, 0.7406234741210938, 0.7753753662109375, 0.8101272583007812, 0.844879150390625, 0.8796310424804688, 0.9143829345703125, 0.9491348266601562, 0.98388671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 1.0, 3.0, 7.0, 11.0, 8.0, 14.0, 13.0, 16.0, 35.0, 41.0, 47.0, 84.0, 160.0, 252.0, 415.0, 729.0, 1386.0, 2867.0, 7451.0, 23423.0, 106552.0, 497975.0, 323975.0, 58314.0, 14798.0, 5224.0, 2198.0, 1033.0, 563.0, 338.0, 189.0, 134.0, 97.0, 53.0, 40.0, 24.0, 23.0, 17.0, 12.0, 7.0, 10.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.6044921875, -0.587615966796875, -0.57073974609375, -0.553863525390625, -0.5369873046875, -0.520111083984375, -0.50323486328125, -0.486358642578125, -0.469482421875, -0.452606201171875, -0.43572998046875, -0.418853759765625, -0.4019775390625, -0.385101318359375, -0.36822509765625, -0.351348876953125, -0.33447265625, -0.317596435546875, -0.30072021484375, -0.283843994140625, -0.2669677734375, -0.250091552734375, -0.23321533203125, -0.216339111328125, -0.199462890625, -0.182586669921875, -0.16571044921875, -0.148834228515625, -0.1319580078125, -0.115081787109375, -0.09820556640625, -0.081329345703125, -0.064453125, -0.047576904296875, -0.03070068359375, -0.013824462890625, 0.0030517578125, 0.019927978515625, 0.03680419921875, 0.053680419921875, 0.070556640625, 0.087432861328125, 0.10430908203125, 0.121185302734375, 0.1380615234375, 0.154937744140625, 0.17181396484375, 0.188690185546875, 0.20556640625, 0.222442626953125, 0.23931884765625, 0.256195068359375, 0.2730712890625, 0.289947509765625, 0.30682373046875, 0.323699951171875, 0.340576171875, 0.357452392578125, 0.37432861328125, 0.391204833984375, 0.4080810546875, 0.424957275390625, 0.44183349609375, 0.458709716796875, 0.4755859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 6.0, 5.0, 15.0, 12.0, 26.0, 26.0, 46.0, 47.0, 70.0, 91.0, 117.0, 127.0, 125.0, 83.0, 48.0, 44.0, 39.0, 23.0, 23.0, 6.0, 4.0, 7.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00017011165618896484, -0.00016617868095636368, -0.0001622457057237625, -0.00015831273049116135, -0.00015437975525856018, -0.00015044678002595901, -0.00014651380479335785, -0.00014258082956075668, -0.00013864785432815552, -0.00013471487909555435, -0.00013078190386295319, -0.00012684892863035202, -0.00012291595339775085, -0.00011898297816514969, -0.00011505000293254852, -0.00011111702769994736, -0.00010718405246734619, -0.00010325107723474503, -9.931810200214386e-05, -9.53851267695427e-05, -9.145215153694153e-05, -8.751917630434036e-05, -8.35862010717392e-05, -7.965322583913803e-05, -7.572025060653687e-05, -7.17872753739357e-05, -6.785430014133453e-05, -6.392132490873337e-05, -5.99883496761322e-05, -5.6055374443531036e-05, -5.212239921092987e-05, -4.8189423978328705e-05, -4.425644874572754e-05, -4.032347351312637e-05, -3.639049828052521e-05, -3.245752304792404e-05, -2.8524547815322876e-05, -2.459157258272171e-05, -2.0658597350120544e-05, -1.672562211751938e-05, -1.2792646884918213e-05, -8.859671652317047e-06, -4.926696419715881e-06, -9.937211871147156e-07, 2.93925404548645e-06, 6.872229278087616e-06, 1.0805204510688782e-05, 1.4738179743289948e-05, 1.8671154975891113e-05, 2.260413020849228e-05, 2.6537105441093445e-05, 3.047008067369461e-05, 3.4403055906295776e-05, 3.833603113889694e-05, 4.226900637149811e-05, 4.6201981604099274e-05, 5.013495683670044e-05, 5.4067932069301605e-05, 5.800090730190277e-05, 6.193388253450394e-05, 6.58668577671051e-05, 6.979983299970627e-05, 7.373280823230743e-05, 7.76657834649086e-05, 8.159875869750977e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 3.0, 13.0, 18.0, 40.0, 81.0, 122.0, 259.0, 428.0, 1019.0, 2616.0, 8315.0, 36580.0, 275942.0, 596525.0, 101745.0, 17181.0, 4627.0, 1637.0, 646.0, 327.0, 143.0, 89.0, 55.0, 38.0, 25.0, 16.0, 9.0, 11.0, 13.0, 1.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.70654296875, -0.6865081787109375, -0.666473388671875, -0.6464385986328125, -0.62640380859375, -0.6063690185546875, -0.586334228515625, -0.5662994384765625, -0.5462646484375, -0.5262298583984375, -0.506195068359375, -0.4861602783203125, -0.46612548828125, -0.4460906982421875, -0.426055908203125, -0.4060211181640625, -0.385986328125, -0.3659515380859375, -0.345916748046875, -0.3258819580078125, -0.30584716796875, -0.2858123779296875, -0.265777587890625, -0.2457427978515625, -0.2257080078125, -0.2056732177734375, -0.185638427734375, -0.1656036376953125, -0.14556884765625, -0.1255340576171875, -0.105499267578125, -0.0854644775390625, -0.0654296875, -0.0453948974609375, -0.025360107421875, -0.0053253173828125, 0.01470947265625, 0.0347442626953125, 0.054779052734375, 0.0748138427734375, 0.0948486328125, 0.1148834228515625, 0.134918212890625, 0.1549530029296875, 0.17498779296875, 0.1950225830078125, 0.215057373046875, 0.2350921630859375, 0.255126953125, 0.2751617431640625, 0.295196533203125, 0.3152313232421875, 0.33526611328125, 0.3553009033203125, 0.375335693359375, 0.3953704833984375, 0.4154052734375, 0.4354400634765625, 0.455474853515625, 0.4755096435546875, 0.49554443359375, 0.5155792236328125, 0.535614013671875, 0.5556488037109375, 0.57568359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 12.0, 10.0, 14.0, 26.0, 23.0, 34.0, 68.0, 73.0, 119.0, 120.0, 111.0, 92.0, 79.0, 63.0, 41.0, 32.0, 24.0, 8.0, 14.0, 6.0, 10.0, 4.0, 3.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.57470703125, -0.5596199035644531, -0.5445327758789062, -0.5294456481933594, -0.5143585205078125, -0.4992713928222656, -0.48418426513671875, -0.4690971374511719, -0.454010009765625, -0.4389228820800781, -0.42383575439453125, -0.4087486267089844, -0.3936614990234375, -0.3785743713378906, -0.36348724365234375, -0.3484001159667969, -0.33331298828125, -0.3182258605957031, -0.30313873291015625, -0.2880516052246094, -0.2729644775390625, -0.2578773498535156, -0.24279022216796875, -0.22770309448242188, -0.212615966796875, -0.19752883911132812, -0.18244171142578125, -0.16735458374023438, -0.1522674560546875, -0.13718032836914062, -0.12209320068359375, -0.10700607299804688, -0.0919189453125, -0.07683181762695312, -0.06174468994140625, -0.046657562255859375, -0.0315704345703125, -0.016483306884765625, -0.00139617919921875, 0.013690948486328125, 0.028778076171875, 0.043865203857421875, 0.05895233154296875, 0.07403945922851562, 0.0891265869140625, 0.10421371459960938, 0.11930084228515625, 0.13438796997070312, 0.14947509765625, 0.16456222534179688, 0.17964935302734375, 0.19473648071289062, 0.2098236083984375, 0.22491073608398438, 0.23999786376953125, 0.2550849914550781, 0.270172119140625, 0.2852592468261719, 0.30034637451171875, 0.3154335021972656, 0.3305206298828125, 0.3456077575683594, 0.36069488525390625, 0.3757820129394531, 0.390869140625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 19.0, 16.0, 46.0, 86.0, 135.0, 204.0, 183.0, 126.0, 62.0, 52.0, 29.0, 23.0, 4.0, 4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.175352096557617, -11.8909912109375, -11.6066312789917, -11.322270393371582, -11.037910461425781, -10.753549575805664, -10.469188690185547, -10.184828758239746, -9.900467872619629, -9.616106986999512, -9.331747055053711, -9.047386169433594, -8.763026237487793, -8.478665351867676, -8.194305419921875, -7.909944534301758, -7.625584125518799, -7.34122371673584, -7.056863307952881, -6.772502899169922, -6.488142013549805, -6.203781604766846, -5.919421195983887, -5.635060787200928, -5.350700378417969, -5.06633996963501, -4.781979560852051, -4.497618675231934, -4.213258266448975, -3.9288978576660156, -3.6445374488830566, -3.3601770401000977, -3.0758161544799805, -2.7914557456970215, -2.5070950984954834, -2.2227346897125244, -1.9383741617202759, -1.6540136337280273, -1.3696532249450684, -1.0852926969528198, -0.8009321689605713, -0.5165716409683228, -0.232211172580719, 0.052149295806884766, 0.3365098237991333, 0.6208703517913818, 0.9052307605743408, 1.1895912885665894, 1.473951816558838, 1.7583123445510864, 2.042672872543335, 2.327033281326294, 2.611393928527832, 2.895754337310791, 3.18011474609375, 3.464475154876709, 3.748835802078247, 4.033196449279785, 4.317556858062744, 4.601917266845703, 4.886277675628662, 5.170638084411621, 5.454998970031738, 5.739359378814697, 6.023719787597656]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 10.0, 6.0, 8.0, 15.0, 11.0, 20.0, 15.0, 18.0, 24.0, 27.0, 46.0, 42.0, 42.0, 39.0, 53.0, 60.0, 48.0, 50.0, 40.0, 61.0, 47.0, 40.0, 40.0, 34.0, 32.0, 30.0, 24.0, 20.0, 12.0, 21.0, 12.0, 12.0, 10.0, 3.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-4.770001411437988, -4.629631042480469, -4.489260673522949, -4.34889030456543, -4.20851993560791, -4.068149566650391, -3.92777943611145, -3.7874090671539307, -3.647038698196411, -3.5066683292388916, -3.366297960281372, -3.2259275913238525, -3.085557460784912, -2.9451870918273926, -2.804816722869873, -2.6644463539123535, -2.524075984954834, -2.3837056159973145, -2.243335247039795, -2.1029648780822754, -1.9625946283340454, -1.8222242593765259, -1.681854009628296, -1.5414836406707764, -1.4011132717132568, -1.2607429027557373, -1.1203725337982178, -0.9800022840499878, -0.8396319150924683, -0.6992615461349487, -0.558891236782074, -0.4185209274291992, -0.2781505584716797, -0.13778021931648254, 0.0025901198387145996, 0.14296045899391174, 0.2833307981491089, 0.4237011671066284, 0.5640714764595032, 0.7044417858123779, 0.8448121547698975, 0.985182523727417, 1.1255528926849365, 1.2659231424331665, 1.406293511390686, 1.5466638803482056, 1.6870341300964355, 1.827404499053955, 1.9677748680114746, 2.108145236968994, 2.2485156059265137, 2.388885974884033, 2.5292563438415527, 2.6696267127990723, 2.8099968433380127, 2.9503672122955322, 3.0907375812530518, 3.2311079502105713, 3.371478319168091, 3.5118486881256104, 3.652218818664551, 3.7925891876220703, 3.93295955657959, 4.073329925537109, 4.213700294494629]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 4.0, 2.0, 10.0, 11.0, 12.0, 15.0, 18.0, 21.0, 20.0, 30.0, 36.0, 52.0, 47.0, 49.0, 79.0, 98.0, 143.0, 160.0, 232.0, 384.0, 710.0, 1235.0, 2823.0, 7460.0, 24687.0, 135258.0, 3723051.0, 245676.0, 35410.0, 10100.0, 3564.0, 1433.0, 695.0, 340.0, 172.0, 92.0, 60.0, 33.0, 21.0, 10.0, 10.0, 3.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.91796875, -2.8525543212890625, -2.787139892578125, -2.7217254638671875, -2.65631103515625, -2.5908966064453125, -2.525482177734375, -2.4600677490234375, -2.3946533203125, -2.3292388916015625, -2.263824462890625, -2.1984100341796875, -2.13299560546875, -2.0675811767578125, -2.002166748046875, -1.9367523193359375, -1.871337890625, -1.8059234619140625, -1.740509033203125, -1.6750946044921875, -1.60968017578125, -1.5442657470703125, -1.478851318359375, -1.4134368896484375, -1.3480224609375, -1.2826080322265625, -1.217193603515625, -1.1517791748046875, -1.08636474609375, -1.0209503173828125, -0.955535888671875, -0.8901214599609375, -0.82470703125, -0.7592926025390625, -0.693878173828125, -0.6284637451171875, -0.56304931640625, -0.4976348876953125, -0.432220458984375, -0.3668060302734375, -0.3013916015625, -0.2359771728515625, -0.170562744140625, -0.1051483154296875, -0.03973388671875, 0.0256805419921875, 0.091094970703125, 0.1565093994140625, 0.221923828125, 0.2873382568359375, 0.352752685546875, 0.4181671142578125, 0.48358154296875, 0.5489959716796875, 0.614410400390625, 0.6798248291015625, 0.7452392578125, 0.8106536865234375, 0.876068115234375, 0.9414825439453125, 1.00689697265625, 1.0723114013671875, 1.137725830078125, 1.2031402587890625, 1.2685546875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 11.0, 20.0, 25.0, 34.0, 52.0, 68.0, 64.0, 100.0, 109.0, 102.0, 109.0, 86.0, 64.0, 50.0, 40.0, 30.0, 13.0, 2.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4345703125, -0.42444419860839844, -0.4143180847167969, -0.4041919708251953, -0.39406585693359375, -0.3839397430419922, -0.3738136291503906, -0.36368751525878906, -0.3535614013671875, -0.34343528747558594, -0.3333091735839844, -0.3231830596923828, -0.31305694580078125, -0.3029308319091797, -0.2928047180175781, -0.28267860412597656, -0.272552490234375, -0.26242637634277344, -0.2523002624511719, -0.2421741485595703, -0.23204803466796875, -0.2219219207763672, -0.21179580688476562, -0.20166969299316406, -0.1915435791015625, -0.18141746520996094, -0.17129135131835938, -0.1611652374267578, -0.15103912353515625, -0.1409130096435547, -0.13078689575195312, -0.12066078186035156, -0.11053466796875, -0.10040855407714844, -0.09028244018554688, -0.08015632629394531, -0.07003021240234375, -0.05990409851074219, -0.049777984619140625, -0.03965187072753906, -0.0295257568359375, -0.019399642944335938, -0.009273529052734375, 0.0008525848388671875, 0.01097869873046875, 0.021104812622070312, 0.031230926513671875, 0.04135704040527344, 0.051483154296875, 0.06160926818847656, 0.07173538208007812, 0.08186149597167969, 0.09198760986328125, 0.10211372375488281, 0.11223983764648438, 0.12236595153808594, 0.1324920654296875, 0.14261817932128906, 0.15274429321289062, 0.1628704071044922, 0.17299652099609375, 0.1831226348876953, 0.19324874877929688, 0.20337486267089844, 0.2135009765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 6.0, 7.0, 13.0, 31.0, 78.0, 146.0, 294.0, 1088.0, 9091.0, 4153450.0, 27882.0, 1546.0, 381.0, 146.0, 67.0, 30.0, 16.0, 11.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.265625, -11.9117431640625, -11.557861328125, -11.2039794921875, -10.85009765625, -10.4962158203125, -10.142333984375, -9.7884521484375, -9.4345703125, -9.0806884765625, -8.726806640625, -8.3729248046875, -8.01904296875, -7.6651611328125, -7.311279296875, -6.9573974609375, -6.603515625, -6.2496337890625, -5.895751953125, -5.5418701171875, -5.18798828125, -4.8341064453125, -4.480224609375, -4.1263427734375, -3.7724609375, -3.4185791015625, -3.064697265625, -2.7108154296875, -2.35693359375, -2.0030517578125, -1.649169921875, -1.2952880859375, -0.94140625, -0.5875244140625, -0.233642578125, 0.1202392578125, 0.47412109375, 0.8280029296875, 1.181884765625, 1.5357666015625, 1.8896484375, 2.2435302734375, 2.597412109375, 2.9512939453125, 3.30517578125, 3.6590576171875, 4.012939453125, 4.3668212890625, 4.720703125, 5.0745849609375, 5.428466796875, 5.7823486328125, 6.13623046875, 6.4901123046875, 6.843994140625, 7.1978759765625, 7.5517578125, 7.9056396484375, 8.259521484375, 8.6134033203125, 8.96728515625, 9.3211669921875, 9.675048828125, 10.0289306640625, 10.3828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 7.0, 9.0, 9.0, 11.0, 20.0, 42.0, 197.0, 2614.0, 1006.0, 111.0, 31.0, 11.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.32421875, -2.255523681640625, -2.18682861328125, -2.118133544921875, -2.0494384765625, -1.980743408203125, -1.91204833984375, -1.843353271484375, -1.774658203125, -1.705963134765625, -1.63726806640625, -1.568572998046875, -1.4998779296875, -1.431182861328125, -1.36248779296875, -1.293792724609375, -1.22509765625, -1.156402587890625, -1.08770751953125, -1.019012451171875, -0.9503173828125, -0.881622314453125, -0.81292724609375, -0.744232177734375, -0.675537109375, -0.606842041015625, -0.53814697265625, -0.469451904296875, -0.4007568359375, -0.332061767578125, -0.26336669921875, -0.194671630859375, -0.1259765625, -0.057281494140625, 0.01141357421875, 0.080108642578125, 0.1488037109375, 0.217498779296875, 0.28619384765625, 0.354888916015625, 0.423583984375, 0.492279052734375, 0.56097412109375, 0.629669189453125, 0.6983642578125, 0.767059326171875, 0.83575439453125, 0.904449462890625, 0.97314453125, 1.041839599609375, 1.11053466796875, 1.179229736328125, 1.2479248046875, 1.316619873046875, 1.38531494140625, 1.454010009765625, 1.522705078125, 1.591400146484375, 1.66009521484375, 1.728790283203125, 1.7974853515625, 1.866180419921875, 1.93487548828125, 2.003570556640625, 2.072265625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 12.0, 47.0, 208.0, 500.0, 188.0, 36.0, 11.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.29140281677246, -23.809968948364258, -23.328535079956055, -22.84710121154785, -22.36566734313965, -21.884233474731445, -21.402799606323242, -20.92136573791504, -20.439931869506836, -19.958498001098633, -19.47706413269043, -18.995630264282227, -18.514196395874023, -18.03276252746582, -17.551328659057617, -17.069894790649414, -16.58846092224121, -16.107027053833008, -15.625593185424805, -15.144159317016602, -14.662725448608398, -14.181291580200195, -13.699857711791992, -13.218423843383789, -12.736989974975586, -12.255556106567383, -11.77412223815918, -11.292688369750977, -10.811254501342773, -10.32982063293457, -9.848386764526367, -9.366952896118164, -8.885518074035645, -8.404084205627441, -7.922650337219238, -7.441216468811035, -6.959782600402832, -6.478348731994629, -5.996914863586426, -5.515480995178223, -5.0340471267700195, -4.552613258361816, -4.071179389953613, -3.58974552154541, -3.108311653137207, -2.626877784729004, -2.145443916320801, -1.6640100479125977, -1.1825761795043945, -0.7011423110961914, -0.21970844268798828, 0.26172542572021484, 0.743159294128418, 1.224593162536621, 1.7060270309448242, 2.1874608993530273, 2.6688947677612305, 3.1503286361694336, 3.6317625045776367, 4.11319637298584, 4.594630241394043, 5.076064109802246, 5.557497978210449, 6.038931846618652, 6.5203657150268555]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 0.0, 6.0, 7.0, 10.0, 13.0, 35.0, 48.0, 72.0, 82.0, 94.0, 100.0, 100.0, 93.0, 77.0, 84.0, 61.0, 39.0, 22.0, 24.0, 13.0, 14.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.191410064697266, -4.041649341583252, -3.8918888568878174, -3.7421281337738037, -3.592367649078369, -3.4426069259643555, -3.292846202850342, -3.1430857181549072, -2.9933252334594727, -2.843564510345459, -2.6938040256500244, -2.5440433025360107, -2.394282817840576, -2.2445220947265625, -2.094761371612549, -1.9450008869171143, -1.7952401638031006, -1.6454795598983765, -1.4957189559936523, -1.3459582328796387, -1.196197748184204, -1.0464370250701904, -0.8966764211654663, -0.7469158172607422, -0.5971552133560181, -0.44739460945129395, -0.29763397574424744, -0.14787334203720093, 0.0018872618675231934, 0.15164786577224731, 0.3014085292816162, 0.45116913318634033, 0.6009297370910645, 0.7506903409957886, 0.9004509449005127, 1.0502116680145264, 1.199972152709961, 1.3497328758239746, 1.4994934797286987, 1.6492540836334229, 1.799014687538147, 1.948775291442871, 2.0985360145568848, 2.2482964992523193, 2.398057222366333, 2.5478177070617676, 2.6975784301757812, 2.847339153289795, 2.9970996379852295, 3.146860361099243, 3.2966208457946777, 3.4463815689086914, 3.596142053604126, 3.7459027767181396, 3.895663261413574, 4.045423984527588, 4.195184707641602, 4.344945430755615, 4.494706153869629, 4.644466400146484, 4.794227123260498, 4.943987846374512, 5.093748569488525, 5.243509292602539, 5.3932695388793945]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 7.0, 8.0, 6.0, 6.0, 11.0, 8.0, 11.0, 22.0, 28.0, 47.0, 62.0, 92.0, 132.0, 196.0, 303.0, 522.0, 980.0, 2213.0, 6578.0, 26310.0, 168298.0, 633333.0, 171528.0, 26481.0, 6655.0, 2334.0, 1025.0, 496.0, 265.0, 194.0, 113.0, 88.0, 44.0, 39.0, 34.0, 19.0, 10.0, 12.0, 9.0, 6.0, 12.0, 5.0, 2.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.87109375, -1.81524658203125, -1.7593994140625, -1.70355224609375, -1.647705078125, -1.59185791015625, -1.5360107421875, -1.48016357421875, -1.42431640625, -1.36846923828125, -1.3126220703125, -1.25677490234375, -1.200927734375, -1.14508056640625, -1.0892333984375, -1.03338623046875, -0.9775390625, -0.92169189453125, -0.8658447265625, -0.80999755859375, -0.754150390625, -0.69830322265625, -0.6424560546875, -0.58660888671875, -0.53076171875, -0.47491455078125, -0.4190673828125, -0.36322021484375, -0.307373046875, -0.25152587890625, -0.1956787109375, -0.13983154296875, -0.083984375, -0.02813720703125, 0.0277099609375, 0.08355712890625, 0.139404296875, 0.19525146484375, 0.2510986328125, 0.30694580078125, 0.36279296875, 0.41864013671875, 0.4744873046875, 0.53033447265625, 0.586181640625, 0.64202880859375, 0.6978759765625, 0.75372314453125, 0.8095703125, 0.86541748046875, 0.9212646484375, 0.97711181640625, 1.032958984375, 1.08880615234375, 1.1446533203125, 1.20050048828125, 1.25634765625, 1.31219482421875, 1.3680419921875, 1.42388916015625, 1.479736328125, 1.53558349609375, 1.5914306640625, 1.64727783203125, 1.703125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 8.0, 6.0, 15.0, 23.0, 17.0, 51.0, 69.0, 79.0, 102.0, 85.0, 115.0, 90.0, 94.0, 82.0, 53.0, 41.0, 29.0, 17.0, 9.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.44677734375, -0.4356727600097656, -0.42456817626953125, -0.4134635925292969, -0.4023590087890625, -0.3912544250488281, -0.38014984130859375, -0.3690452575683594, -0.357940673828125, -0.3468360900878906, -0.33573150634765625, -0.3246269226074219, -0.3135223388671875, -0.3024177551269531, -0.29131317138671875, -0.2802085876464844, -0.26910400390625, -0.2579994201660156, -0.24689483642578125, -0.23579025268554688, -0.2246856689453125, -0.21358108520507812, -0.20247650146484375, -0.19137191772460938, -0.180267333984375, -0.16916275024414062, -0.15805816650390625, -0.14695358276367188, -0.1358489990234375, -0.12474441528320312, -0.11363983154296875, -0.10253524780273438, -0.0914306640625, -0.08032608032226562, -0.06922149658203125, -0.058116912841796875, -0.0470123291015625, -0.035907745361328125, -0.02480316162109375, -0.013698577880859375, -0.002593994140625, 0.008510589599609375, 0.01961517333984375, 0.030719757080078125, 0.0418243408203125, 0.052928924560546875, 0.06403350830078125, 0.07513809204101562, 0.08624267578125, 0.09734725952148438, 0.10845184326171875, 0.11955642700195312, 0.1306610107421875, 0.14176559448242188, 0.15287017822265625, 0.16397476196289062, 0.175079345703125, 0.18618392944335938, 0.19728851318359375, 0.20839309692382812, 0.2194976806640625, 0.23060226440429688, 0.24170684814453125, 0.2528114318847656, 0.263916015625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 13.0, 20.0, 36.0, 39.0, 74.0, 133.0, 269.0, 669.0, 1708.0, 6191.0, 29036.0, 173133.0, 571332.0, 219030.0, 36180.0, 7260.0, 2006.0, 745.0, 297.0, 144.0, 67.0, 44.0, 23.0, 26.0, 10.0, 14.0, 12.0, 2.0, 8.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.091796875, -1.0560760498046875, -1.020355224609375, -0.9846343994140625, -0.94891357421875, -0.9131927490234375, -0.877471923828125, -0.8417510986328125, -0.8060302734375, -0.7703094482421875, -0.734588623046875, -0.6988677978515625, -0.66314697265625, -0.6274261474609375, -0.591705322265625, -0.5559844970703125, -0.520263671875, -0.4845428466796875, -0.448822021484375, -0.4131011962890625, -0.37738037109375, -0.3416595458984375, -0.305938720703125, -0.2702178955078125, -0.2344970703125, -0.1987762451171875, -0.163055419921875, -0.1273345947265625, -0.09161376953125, -0.0558929443359375, -0.020172119140625, 0.0155487060546875, 0.05126953125, 0.0869903564453125, 0.122711181640625, 0.1584320068359375, 0.19415283203125, 0.2298736572265625, 0.265594482421875, 0.3013153076171875, 0.3370361328125, 0.3727569580078125, 0.408477783203125, 0.4441986083984375, 0.47991943359375, 0.5156402587890625, 0.551361083984375, 0.5870819091796875, 0.622802734375, 0.6585235595703125, 0.694244384765625, 0.7299652099609375, 0.76568603515625, 0.8014068603515625, 0.837127685546875, 0.8728485107421875, 0.9085693359375, 0.9442901611328125, 0.980010986328125, 1.0157318115234375, 1.05145263671875, 1.0871734619140625, 1.122894287109375, 1.1586151123046875, 1.1943359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 3.0, 12.0, 14.0, 19.0, 9.0, 25.0, 26.0, 31.0, 36.0, 40.0, 38.0, 39.0, 35.0, 51.0, 54.0, 44.0, 61.0, 51.0, 47.0, 46.0, 34.0, 48.0, 29.0, 43.0, 23.0, 19.0, 27.0, 18.0, 20.0, 9.0, 9.0, 5.0, 9.0, 8.0, 2.0, 7.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.701171875, -0.6781005859375, -0.655029296875, -0.6319580078125, -0.60888671875, -0.5858154296875, -0.562744140625, -0.5396728515625, -0.5166015625, -0.4935302734375, -0.470458984375, -0.4473876953125, -0.42431640625, -0.4012451171875, -0.378173828125, -0.3551025390625, -0.33203125, -0.3089599609375, -0.285888671875, -0.2628173828125, -0.23974609375, -0.2166748046875, -0.193603515625, -0.1705322265625, -0.1474609375, -0.1243896484375, -0.101318359375, -0.0782470703125, -0.05517578125, -0.0321044921875, -0.009033203125, 0.0140380859375, 0.037109375, 0.0601806640625, 0.083251953125, 0.1063232421875, 0.12939453125, 0.1524658203125, 0.175537109375, 0.1986083984375, 0.2216796875, 0.2447509765625, 0.267822265625, 0.2908935546875, 0.31396484375, 0.3370361328125, 0.360107421875, 0.3831787109375, 0.40625, 0.4293212890625, 0.452392578125, 0.4754638671875, 0.49853515625, 0.5216064453125, 0.544677734375, 0.5677490234375, 0.5908203125, 0.6138916015625, 0.636962890625, 0.6600341796875, 0.68310546875, 0.7061767578125, 0.729248046875, 0.7523193359375, 0.775390625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 2.0, 12.0, 17.0, 24.0, 47.0, 78.0, 124.0, 228.0, 539.0, 1280.0, 4799.0, 30497.0, 387699.0, 564677.0, 49008.0, 6633.0, 1675.0, 614.0, 270.0, 162.0, 60.0, 41.0, 20.0, 12.0, 12.0, 10.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6875, -0.6601104736328125, -0.632720947265625, -0.6053314208984375, -0.57794189453125, -0.5505523681640625, -0.523162841796875, -0.4957733154296875, -0.4683837890625, -0.4409942626953125, -0.413604736328125, -0.3862152099609375, -0.35882568359375, -0.3314361572265625, -0.304046630859375, -0.2766571044921875, -0.249267578125, -0.2218780517578125, -0.194488525390625, -0.1670989990234375, -0.13970947265625, -0.1123199462890625, -0.084930419921875, -0.0575408935546875, -0.0301513671875, -0.0027618408203125, 0.024627685546875, 0.0520172119140625, 0.07940673828125, 0.1067962646484375, 0.134185791015625, 0.1615753173828125, 0.18896484375, 0.2163543701171875, 0.243743896484375, 0.2711334228515625, 0.29852294921875, 0.3259124755859375, 0.353302001953125, 0.3806915283203125, 0.4080810546875, 0.4354705810546875, 0.462860107421875, 0.4902496337890625, 0.51763916015625, 0.5450286865234375, 0.572418212890625, 0.5998077392578125, 0.627197265625, 0.6545867919921875, 0.681976318359375, 0.7093658447265625, 0.73675537109375, 0.7641448974609375, 0.791534423828125, 0.8189239501953125, 0.8463134765625, 0.8737030029296875, 0.901092529296875, 0.9284820556640625, 0.95587158203125, 0.9832611083984375, 1.010650634765625, 1.0380401611328125, 1.0654296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 8.0, 2.0, 20.0, 10.0, 22.0, 40.0, 62.0, 87.0, 97.0, 130.0, 152.0, 111.0, 98.0, 47.0, 42.0, 32.0, 14.0, 8.0, 7.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012421607971191406, -0.00011979788541793823, -0.0001153796911239624, -0.00011096149682998657, -0.00010654330253601074, -0.00010212510824203491, -9.770691394805908e-05, -9.328871965408325e-05, -8.887052536010742e-05, -8.445233106613159e-05, -8.003413677215576e-05, -7.561594247817993e-05, -7.11977481842041e-05, -6.677955389022827e-05, -6.236135959625244e-05, -5.794316530227661e-05, -5.352497100830078e-05, -4.910677671432495e-05, -4.468858242034912e-05, -4.027038812637329e-05, -3.585219383239746e-05, -3.143399953842163e-05, -2.70158052444458e-05, -2.259761095046997e-05, -1.817941665649414e-05, -1.376122236251831e-05, -9.34302806854248e-06, -4.92483377456665e-06, -5.066394805908203e-07, 3.91155481338501e-06, 8.32974910736084e-06, 1.274794340133667e-05, 1.71661376953125e-05, 2.158433198928833e-05, 2.600252628326416e-05, 3.042072057723999e-05, 3.483891487121582e-05, 3.925710916519165e-05, 4.367530345916748e-05, 4.809349775314331e-05, 5.251169204711914e-05, 5.692988634109497e-05, 6.13480806350708e-05, 6.576627492904663e-05, 7.018446922302246e-05, 7.460266351699829e-05, 7.902085781097412e-05, 8.343905210494995e-05, 8.785724639892578e-05, 9.227544069290161e-05, 9.669363498687744e-05, 0.00010111182928085327, 0.0001055300235748291, 0.00010994821786880493, 0.00011436641216278076, 0.00011878460645675659, 0.00012320280075073242, 0.00012762099504470825, 0.00013203918933868408, 0.0001364573836326599, 0.00014087557792663574, 0.00014529377222061157, 0.0001497119665145874, 0.00015413016080856323, 0.00015854835510253906]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 10.0, 7.0, 19.0, 15.0, 27.0, 52.0, 89.0, 215.0, 533.0, 2242.0, 12495.0, 133208.0, 756807.0, 127950.0, 11892.0, 2014.0, 558.0, 177.0, 84.0, 54.0, 34.0, 26.0, 18.0, 8.0, 6.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.503997802734375, -0.47674560546875, -0.449493408203125, -0.4222412109375, -0.394989013671875, -0.36773681640625, -0.340484619140625, -0.313232421875, -0.285980224609375, -0.25872802734375, -0.231475830078125, -0.2042236328125, -0.176971435546875, -0.14971923828125, -0.122467041015625, -0.09521484375, -0.067962646484375, -0.04071044921875, -0.013458251953125, 0.0137939453125, 0.041046142578125, 0.06829833984375, 0.095550537109375, 0.122802734375, 0.150054931640625, 0.17730712890625, 0.204559326171875, 0.2318115234375, 0.259063720703125, 0.28631591796875, 0.313568115234375, 0.3408203125, 0.368072509765625, 0.39532470703125, 0.422576904296875, 0.4498291015625, 0.477081298828125, 0.50433349609375, 0.531585693359375, 0.558837890625, 0.586090087890625, 0.61334228515625, 0.640594482421875, 0.6678466796875, 0.695098876953125, 0.72235107421875, 0.749603271484375, 0.77685546875, 0.804107666015625, 0.83135986328125, 0.858612060546875, 0.8858642578125, 0.913116455078125, 0.94036865234375, 0.967620849609375, 0.994873046875, 1.022125244140625, 1.04937744140625, 1.076629638671875, 1.1038818359375, 1.131134033203125, 1.15838623046875, 1.185638427734375, 1.212890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 11.0, 9.0, 12.0, 15.0, 20.0, 34.0, 41.0, 64.0, 52.0, 71.0, 100.0, 92.0, 77.0, 73.0, 66.0, 61.0, 52.0, 35.0, 19.0, 21.0, 17.0, 14.0, 11.0, 6.0, 6.0, 2.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2420654296875, -0.23076820373535156, -0.21947097778320312, -0.2081737518310547, -0.19687652587890625, -0.1855792999267578, -0.17428207397460938, -0.16298484802246094, -0.1516876220703125, -0.14039039611816406, -0.12909317016601562, -0.11779594421386719, -0.10649871826171875, -0.09520149230957031, -0.08390426635742188, -0.07260704040527344, -0.061309814453125, -0.05001258850097656, -0.038715362548828125, -0.027418136596679688, -0.01612091064453125, -0.0048236846923828125, 0.006473541259765625, 0.017770767211914062, 0.0290679931640625, 0.04036521911621094, 0.051662445068359375, 0.06295967102050781, 0.07425689697265625, 0.08555412292480469, 0.09685134887695312, 0.10814857482910156, 0.11944580078125, 0.13074302673339844, 0.14204025268554688, 0.1533374786376953, 0.16463470458984375, 0.1759319305419922, 0.18722915649414062, 0.19852638244628906, 0.2098236083984375, 0.22112083435058594, 0.23241806030273438, 0.2437152862548828, 0.25501251220703125, 0.2663097381591797, 0.2776069641113281, 0.28890419006347656, 0.300201416015625, 0.31149864196777344, 0.3227958679199219, 0.3340930938720703, 0.34539031982421875, 0.3566875457763672, 0.3679847717285156, 0.37928199768066406, 0.3905792236328125, 0.40187644958496094, 0.4131736755371094, 0.4244709014892578, 0.43576812744140625, 0.4470653533935547, 0.4583625793457031, 0.46965980529785156, 0.48095703125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 25.0, 55.0, 144.0, 281.0, 241.0, 144.0, 72.0, 26.0, 8.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.50307846069336, -19.111434936523438, -18.71979331970215, -18.328149795532227, -17.936508178710938, -17.544864654541016, -17.153221130371094, -16.761579513549805, -16.369935989379883, -15.978293418884277, -15.586650848388672, -15.19500732421875, -14.803364753723145, -14.411722183227539, -14.020079612731934, -13.628437042236328, -13.236794471740723, -12.845151901245117, -12.453509330749512, -12.061866760253906, -11.670223236083984, -11.278580665588379, -10.886938095092773, -10.495295524597168, -10.103652954101562, -9.712010383605957, -9.320367813110352, -8.92872428894043, -8.537081718444824, -8.145439147949219, -7.753796577453613, -7.362154006958008, -6.9705095291137695, -6.578866958618164, -6.1872239112854, -5.795581340789795, -5.403938293457031, -5.012295722961426, -4.62065315246582, -4.229010581970215, -3.837367534637451, -3.4457247257232666, -3.054081916809082, -2.6624393463134766, -2.270796537399292, -1.8791537284851074, -1.487511157989502, -1.0958683490753174, -0.7042255401611328, -0.312582790851593, 0.07905995845794678, 0.4707026481628418, 0.8623454570770264, 1.253988265991211, 1.6456308364868164, 2.037273645401001, 2.4289164543151855, 2.82055926322937, 3.2122020721435547, 3.60384464263916, 3.9954874515533447, 4.387130260467529, 4.778772830963135, 5.170415878295898, 5.562058448791504]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 7.0, 10.0, 16.0, 14.0, 20.0, 24.0, 30.0, 27.0, 34.0, 43.0, 51.0, 49.0, 55.0, 48.0, 47.0, 71.0, 52.0, 48.0, 47.0, 49.0, 46.0, 23.0, 29.0, 24.0, 27.0, 14.0, 22.0, 14.0, 16.0, 13.0, 4.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.57539176940918, -4.432658672332764, -4.289925575256348, -4.147192478179932, -4.004459381103516, -3.8617262840270996, -3.7189931869506836, -3.5762600898742676, -3.4335269927978516, -3.2907938957214355, -3.1480607986450195, -3.0053277015686035, -2.8625946044921875, -2.7198615074157715, -2.5771284103393555, -2.4343953132629395, -2.2916624546051025, -2.1489293575286865, -2.0061962604522705, -1.8634631633758545, -1.7207300662994385, -1.5779969692230225, -1.435263991355896, -1.29253089427948, -1.149797797203064, -1.007064700126648, -0.8643316030502319, -0.7215985655784607, -0.5788654685020447, -0.43613237142562866, -0.2933993339538574, -0.1506662368774414, -0.00793313980102539, 0.13479994237422943, 0.27753302454948425, 0.4202660918235779, 0.5629991888999939, 0.7057322859764099, 0.8484653234481812, 0.9911984205245972, 1.1339315176010132, 1.2766646146774292, 1.4193977117538452, 1.5621306896209717, 1.7048637866973877, 1.8475968837738037, 1.9903299808502197, 2.1330630779266357, 2.2757961750030518, 2.4185292720794678, 2.561262369155884, 2.7039954662323, 2.846728563308716, 2.989461660385132, 3.1321945190429688, 3.2749276161193848, 3.417660713195801, 3.560393810272217, 3.703126907348633, 3.845860004425049, 3.988593101501465, 4.131326198577881, 4.274059295654297, 4.416792392730713, 4.559525489807129]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 7.0, 13.0, 11.0, 11.0, 12.0, 15.0, 23.0, 34.0, 42.0, 56.0, 64.0, 100.0, 127.0, 175.0, 317.0, 573.0, 1106.0, 2593.0, 7793.0, 32349.0, 628880.0, 3455649.0, 47820.0, 10218.0, 3368.0, 1416.0, 651.0, 304.0, 216.0, 136.0, 74.0, 38.0, 28.0, 15.0, 7.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0], "bins": [-2.875, -2.809814453125, -2.74462890625, -2.679443359375, -2.6142578125, -2.549072265625, -2.48388671875, -2.418701171875, -2.353515625, -2.288330078125, -2.22314453125, -2.157958984375, -2.0927734375, -2.027587890625, -1.96240234375, -1.897216796875, -1.83203125, -1.766845703125, -1.70166015625, -1.636474609375, -1.5712890625, -1.506103515625, -1.44091796875, -1.375732421875, -1.310546875, -1.245361328125, -1.18017578125, -1.114990234375, -1.0498046875, -0.984619140625, -0.91943359375, -0.854248046875, -0.7890625, -0.723876953125, -0.65869140625, -0.593505859375, -0.5283203125, -0.463134765625, -0.39794921875, -0.332763671875, -0.267578125, -0.202392578125, -0.13720703125, -0.072021484375, -0.0068359375, 0.058349609375, 0.12353515625, 0.188720703125, 0.25390625, 0.319091796875, 0.38427734375, 0.449462890625, 0.5146484375, 0.579833984375, 0.64501953125, 0.710205078125, 0.775390625, 0.840576171875, 0.90576171875, 0.970947265625, 1.0361328125, 1.101318359375, 1.16650390625, 1.231689453125, 1.296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 16.0, 13.0, 30.0, 55.0, 56.0, 65.0, 96.0, 80.0, 96.0, 76.0, 91.0, 71.0, 60.0, 62.0, 45.0, 23.0, 18.0, 10.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.42822265625, -0.41744232177734375, -0.4066619873046875, -0.39588165283203125, -0.385101318359375, -0.37432098388671875, -0.3635406494140625, -0.35276031494140625, -0.34197998046875, -0.33119964599609375, -0.3204193115234375, -0.30963897705078125, -0.298858642578125, -0.28807830810546875, -0.2772979736328125, -0.26651763916015625, -0.2557373046875, -0.24495697021484375, -0.2341766357421875, -0.22339630126953125, -0.212615966796875, -0.20183563232421875, -0.1910552978515625, -0.18027496337890625, -0.16949462890625, -0.15871429443359375, -0.1479339599609375, -0.13715362548828125, -0.126373291015625, -0.11559295654296875, -0.1048126220703125, -0.09403228759765625, -0.083251953125, -0.07247161865234375, -0.0616912841796875, -0.05091094970703125, -0.040130615234375, -0.02935028076171875, -0.0185699462890625, -0.00778961181640625, 0.00299072265625, 0.01377105712890625, 0.0245513916015625, 0.03533172607421875, 0.046112060546875, 0.05689239501953125, 0.0676727294921875, 0.07845306396484375, 0.0892333984375, 0.10001373291015625, 0.1107940673828125, 0.12157440185546875, 0.132354736328125, 0.14313507080078125, 0.1539154052734375, 0.16469573974609375, 0.17547607421875, 0.18625640869140625, 0.1970367431640625, 0.20781707763671875, 0.218597412109375, 0.22937774658203125, 0.2401580810546875, 0.25093841552734375, 0.26171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 11.0, 5.0, 15.0, 10.0, 16.0, 24.0, 46.0, 43.0, 97.0, 125.0, 180.0, 346.0, 610.0, 1130.0, 2483.0, 6044.0, 18418.0, 74643.0, 1214298.0, 2741163.0, 98637.0, 22715.0, 7312.0, 2834.0, 1293.0, 676.0, 393.0, 229.0, 157.0, 93.0, 52.0, 53.0, 29.0, 30.0, 10.0, 20.0, 7.0, 2.0, 4.0, 4.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.23046875, -1.1908721923828125, -1.151275634765625, -1.1116790771484375, -1.07208251953125, -1.0324859619140625, -0.992889404296875, -0.9532928466796875, -0.9136962890625, -0.8740997314453125, -0.834503173828125, -0.7949066162109375, -0.75531005859375, -0.7157135009765625, -0.676116943359375, -0.6365203857421875, -0.596923828125, -0.5573272705078125, -0.517730712890625, -0.4781341552734375, -0.43853759765625, -0.3989410400390625, -0.359344482421875, -0.3197479248046875, -0.2801513671875, -0.2405548095703125, -0.200958251953125, -0.1613616943359375, -0.12176513671875, -0.0821685791015625, -0.042572021484375, -0.0029754638671875, 0.03662109375, 0.0762176513671875, 0.115814208984375, 0.1554107666015625, 0.19500732421875, 0.2346038818359375, 0.274200439453125, 0.3137969970703125, 0.3533935546875, 0.3929901123046875, 0.432586669921875, 0.4721832275390625, 0.51177978515625, 0.5513763427734375, 0.590972900390625, 0.6305694580078125, 0.670166015625, 0.7097625732421875, 0.749359130859375, 0.7889556884765625, 0.82855224609375, 0.8681488037109375, 0.907745361328125, 0.9473419189453125, 0.9869384765625, 1.0265350341796875, 1.066131591796875, 1.1057281494140625, 1.14532470703125, 1.1849212646484375, 1.224517822265625, 1.2641143798828125, 1.3037109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 5.0, 18.0, 14.0, 17.0, 32.0, 39.0, 61.0, 93.0, 191.0, 519.0, 1524.0, 816.0, 297.0, 149.0, 97.0, 52.0, 40.0, 28.0, 12.0, 10.0, 13.0, 12.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.378662109375, -0.3650016784667969, -0.35134124755859375, -0.3376808166503906, -0.3240203857421875, -0.3103599548339844, -0.29669952392578125, -0.2830390930175781, -0.269378662109375, -0.2557182312011719, -0.24205780029296875, -0.22839736938476562, -0.2147369384765625, -0.20107650756835938, -0.18741607666015625, -0.17375564575195312, -0.16009521484375, -0.14643478393554688, -0.13277435302734375, -0.11911392211914062, -0.1054534912109375, -0.09179306030273438, -0.07813262939453125, -0.06447219848632812, -0.050811767578125, -0.037151336669921875, -0.02349090576171875, -0.009830474853515625, 0.0038299560546875, 0.017490386962890625, 0.03115081787109375, 0.044811248779296875, 0.0584716796875, 0.07213211059570312, 0.08579254150390625, 0.09945297241210938, 0.1131134033203125, 0.12677383422851562, 0.14043426513671875, 0.15409469604492188, 0.167755126953125, 0.18141555786132812, 0.19507598876953125, 0.20873641967773438, 0.2223968505859375, 0.23605728149414062, 0.24971771240234375, 0.2633781433105469, 0.27703857421875, 0.2906990051269531, 0.30435943603515625, 0.3180198669433594, 0.3316802978515625, 0.3453407287597656, 0.35900115966796875, 0.3726615905761719, 0.386322021484375, 0.3999824523925781, 0.41364288330078125, 0.4273033142089844, 0.4409637451171875, 0.4546241760253906, 0.46828460693359375, 0.4819450378417969, 0.49560546875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 11.0, 19.0, 76.0, 303.0, 382.0, 163.0, 42.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4266514778137207, -2.1859872341156006, -1.9453227519989014, -1.7046585083007812, -1.4639941453933716, -1.223329782485962, -0.9826655387878418, -0.7420011758804321, -0.5013368129730225, -0.2606724798679352, -0.0200081467628479, 0.220656156539917, 0.46132051944732666, 0.7019848823547363, 0.9426491260528564, 1.1833134889602661, 1.4239778518676758, 1.6646422147750854, 1.9053065776824951, 2.1459708213806152, 2.3866353034973145, 2.6272995471954346, 2.8679637908935547, 3.108628273010254, 3.349292516708374, 3.589956760406494, 3.8306212425231934, 4.071285247802734, 4.311949729919434, 4.552614212036133, 4.793278694152832, 5.033942699432373, 5.274606704711914, 5.515271186828613, 5.755935192108154, 5.9965996742248535, 6.237264156341553, 6.477928161621094, 6.718592643737793, 6.959257125854492, 7.199921607971191, 7.440586090087891, 7.681250095367432, 7.921914577484131, 8.162578582763672, 8.403243064880371, 8.64390754699707, 8.88457202911377, 9.125236511230469, 9.365900993347168, 9.606565475463867, 9.84722900390625, 10.08789348602295, 10.328557968139648, 10.569222450256348, 10.809886932373047, 11.05055046081543, 11.291214942932129, 11.531879425048828, 11.772542953491211, 12.01320743560791, 12.25387191772461, 12.494536399841309, 12.735200881958008, 12.975865364074707]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 8.0, 11.0, 8.0, 11.0, 12.0, 22.0, 24.0, 28.0, 36.0, 49.0, 37.0, 49.0, 47.0, 50.0, 48.0, 54.0, 61.0, 54.0, 54.0, 52.0, 43.0, 45.0, 43.0, 26.0, 30.0, 28.0, 16.0, 19.0, 6.0, 8.0, 11.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4040803909301758, -1.3527841567993164, -1.301487922668457, -1.2501916885375977, -1.1988954544067383, -1.147599220275879, -1.09630286693573, -1.0450066328048706, -0.9937103986740112, -0.9424141645431519, -0.8911179304122925, -0.8398216366767883, -0.788525402545929, -0.7372291684150696, -0.6859328746795654, -0.634636640548706, -0.5833404064178467, -0.5320441722869873, -0.48074790835380554, -0.4294516444206238, -0.3781554102897644, -0.32685917615890503, -0.27556291222572327, -0.2242666482925415, -0.17297041416168213, -0.12167416512966156, -0.07037791609764099, -0.019081667065620422, 0.032214581966400146, 0.08351081609725952, 0.13480708003044128, 0.18610334396362305, 0.23739969730377197, 0.28869593143463135, 0.3399921953678131, 0.3912884593009949, 0.44258469343185425, 0.4938809275627136, 0.5451772212982178, 0.5964734554290771, 0.6477696895599365, 0.6990659236907959, 0.7503621578216553, 0.8016584515571594, 0.8529546856880188, 0.9042509198188782, 0.9555472135543823, 1.0068434476852417, 1.058139681816101, 1.1094359159469604, 1.1607321500778198, 1.2120283842086792, 1.2633247375488281, 1.3146209716796875, 1.3659172058105469, 1.4172134399414062, 1.4685096740722656, 1.519805908203125, 1.5711021423339844, 1.6223983764648438, 1.6736946105957031, 1.7249908447265625, 1.7762871980667114, 1.8275834321975708, 1.8788796663284302]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 13.0, 15.0, 13.0, 28.0, 45.0, 55.0, 91.0, 150.0, 277.0, 521.0, 1187.0, 3159.0, 12052.0, 77991.0, 585883.0, 321296.0, 34956.0, 6832.0, 2104.0, 866.0, 426.0, 216.0, 119.0, 72.0, 56.0, 33.0, 26.0, 15.0, 12.0, 10.0, 7.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7490234375, -1.6812591552734375, -1.613494873046875, -1.5457305908203125, -1.47796630859375, -1.4102020263671875, -1.342437744140625, -1.2746734619140625, -1.2069091796875, -1.1391448974609375, -1.071380615234375, -1.0036163330078125, -0.93585205078125, -0.8680877685546875, -0.800323486328125, -0.7325592041015625, -0.664794921875, -0.5970306396484375, -0.529266357421875, -0.4615020751953125, -0.39373779296875, -0.3259735107421875, -0.258209228515625, -0.1904449462890625, -0.1226806640625, -0.0549163818359375, 0.012847900390625, 0.0806121826171875, 0.14837646484375, 0.2161407470703125, 0.283905029296875, 0.3516693115234375, 0.41943359375, 0.4871978759765625, 0.554962158203125, 0.6227264404296875, 0.69049072265625, 0.7582550048828125, 0.826019287109375, 0.8937835693359375, 0.9615478515625, 1.0293121337890625, 1.097076416015625, 1.1648406982421875, 1.23260498046875, 1.3003692626953125, 1.368133544921875, 1.4358978271484375, 1.503662109375, 1.5714263916015625, 1.639190673828125, 1.7069549560546875, 1.77471923828125, 1.8424835205078125, 1.910247802734375, 1.9780120849609375, 2.0457763671875, 2.1135406494140625, 2.181304931640625, 2.2490692138671875, 2.31683349609375, 2.3845977783203125, 2.452362060546875, 2.5201263427734375, 2.587890625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 12.0, 12.0, 16.0, 25.0, 45.0, 60.0, 57.0, 79.0, 81.0, 92.0, 97.0, 77.0, 78.0, 76.0, 58.0, 43.0, 32.0, 20.0, 15.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.43359375, -0.4227867126464844, -0.41197967529296875, -0.4011726379394531, -0.3903656005859375, -0.3795585632324219, -0.36875152587890625, -0.3579444885253906, -0.347137451171875, -0.3363304138183594, -0.32552337646484375, -0.3147163391113281, -0.3039093017578125, -0.2931022644042969, -0.28229522705078125, -0.2714881896972656, -0.26068115234375, -0.24987411499023438, -0.23906707763671875, -0.22826004028320312, -0.2174530029296875, -0.20664596557617188, -0.19583892822265625, -0.18503189086914062, -0.174224853515625, -0.16341781616210938, -0.15261077880859375, -0.14180374145507812, -0.1309967041015625, -0.12018966674804688, -0.10938262939453125, -0.09857559204101562, -0.0877685546875, -0.07696151733398438, -0.06615447998046875, -0.055347442626953125, -0.0445404052734375, -0.033733367919921875, -0.02292633056640625, -0.012119293212890625, -0.001312255859375, 0.009494781494140625, 0.02030181884765625, 0.031108856201171875, 0.0419158935546875, 0.052722930908203125, 0.06352996826171875, 0.07433700561523438, 0.08514404296875, 0.09595108032226562, 0.10675811767578125, 0.11756515502929688, 0.1283721923828125, 0.13917922973632812, 0.14998626708984375, 0.16079330444335938, 0.171600341796875, 0.18240737915039062, 0.19321441650390625, 0.20402145385742188, 0.2148284912109375, 0.22563552856445312, 0.23644256591796875, 0.24724960327148438, 0.258056640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 7.0, 8.0, 5.0, 5.0, 8.0, 3.0, 6.0, 10.0, 10.0, 16.0, 38.0, 44.0, 82.0, 168.0, 283.0, 581.0, 1340.0, 3710.0, 11489.0, 44796.0, 206902.0, 510060.0, 206784.0, 44331.0, 11613.0, 3668.0, 1423.0, 545.0, 253.0, 132.0, 74.0, 50.0, 34.0, 20.0, 14.0, 15.0, 5.0, 8.0, 4.0, 6.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.98193359375, -0.9486465454101562, -0.9153594970703125, -0.8820724487304688, -0.848785400390625, -0.8154983520507812, -0.7822113037109375, -0.7489242553710938, -0.71563720703125, -0.6823501586914062, -0.6490631103515625, -0.6157760620117188, -0.582489013671875, -0.5492019653320312, -0.5159149169921875, -0.48262786865234375, -0.4493408203125, -0.41605377197265625, -0.3827667236328125, -0.34947967529296875, -0.316192626953125, -0.28290557861328125, -0.2496185302734375, -0.21633148193359375, -0.18304443359375, -0.14975738525390625, -0.1164703369140625, -0.08318328857421875, -0.049896240234375, -0.01660919189453125, 0.0166778564453125, 0.04996490478515625, 0.083251953125, 0.11653900146484375, 0.1498260498046875, 0.18311309814453125, 0.216400146484375, 0.24968719482421875, 0.2829742431640625, 0.31626129150390625, 0.34954833984375, 0.38283538818359375, 0.4161224365234375, 0.44940948486328125, 0.482696533203125, 0.5159835815429688, 0.5492706298828125, 0.5825576782226562, 0.6158447265625, 0.6491317749023438, 0.6824188232421875, 0.7157058715820312, 0.748992919921875, 0.7822799682617188, 0.8155670166015625, 0.8488540649414062, 0.88214111328125, 0.9154281616210938, 0.9487152099609375, 0.9820022583007812, 1.015289306640625, 1.0485763549804688, 1.0818634033203125, 1.1151504516601562, 1.1484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 0.0, 5.0, 2.0, 5.0, 5.0, 8.0, 5.0, 10.0, 14.0, 10.0, 17.0, 19.0, 19.0, 33.0, 28.0, 29.0, 26.0, 23.0, 43.0, 49.0, 35.0, 48.0, 47.0, 46.0, 41.0, 39.0, 46.0, 40.0, 43.0, 43.0, 33.0, 29.0, 24.0, 21.0, 17.0, 12.0, 18.0, 17.0, 8.0, 4.0, 12.0, 4.0, 8.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.814453125, -0.790679931640625, -0.76690673828125, -0.743133544921875, -0.7193603515625, -0.695587158203125, -0.67181396484375, -0.648040771484375, -0.624267578125, -0.600494384765625, -0.57672119140625, -0.552947998046875, -0.5291748046875, -0.505401611328125, -0.48162841796875, -0.457855224609375, -0.43408203125, -0.410308837890625, -0.38653564453125, -0.362762451171875, -0.3389892578125, -0.315216064453125, -0.29144287109375, -0.267669677734375, -0.243896484375, -0.220123291015625, -0.19635009765625, -0.172576904296875, -0.1488037109375, -0.125030517578125, -0.10125732421875, -0.077484130859375, -0.0537109375, -0.029937744140625, -0.00616455078125, 0.017608642578125, 0.0413818359375, 0.065155029296875, 0.08892822265625, 0.112701416015625, 0.136474609375, 0.160247802734375, 0.18402099609375, 0.207794189453125, 0.2315673828125, 0.255340576171875, 0.27911376953125, 0.302886962890625, 0.32666015625, 0.350433349609375, 0.37420654296875, 0.397979736328125, 0.4217529296875, 0.445526123046875, 0.46929931640625, 0.493072509765625, 0.516845703125, 0.540618896484375, 0.56439208984375, 0.588165283203125, 0.6119384765625, 0.635711669921875, 0.65948486328125, 0.683258056640625, 0.70703125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 1.0, 4.0, 4.0, 17.0, 21.0, 43.0, 60.0, 130.0, 277.0, 639.0, 1901.0, 8414.0, 70141.0, 717466.0, 226563.0, 17770.0, 3346.0, 941.0, 383.0, 167.0, 96.0, 59.0, 38.0, 25.0, 17.0, 4.0, 9.0, 9.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96875, -0.9381942749023438, -0.9076385498046875, -0.8770828247070312, -0.846527099609375, -0.8159713745117188, -0.7854156494140625, -0.7548599243164062, -0.72430419921875, -0.6937484741210938, -0.6631927490234375, -0.6326370239257812, -0.602081298828125, -0.5715255737304688, -0.5409698486328125, -0.5104141235351562, -0.4798583984375, -0.44930267333984375, -0.4187469482421875, -0.38819122314453125, -0.357635498046875, -0.32707977294921875, -0.2965240478515625, -0.26596832275390625, -0.23541259765625, -0.20485687255859375, -0.1743011474609375, -0.14374542236328125, -0.113189697265625, -0.08263397216796875, -0.0520782470703125, -0.02152252197265625, 0.009033203125, 0.03958892822265625, 0.0701446533203125, 0.10070037841796875, 0.131256103515625, 0.16181182861328125, 0.1923675537109375, 0.22292327880859375, 0.25347900390625, 0.28403472900390625, 0.3145904541015625, 0.34514617919921875, 0.375701904296875, 0.40625762939453125, 0.4368133544921875, 0.46736907958984375, 0.4979248046875, 0.5284805297851562, 0.5590362548828125, 0.5895919799804688, 0.620147705078125, 0.6507034301757812, 0.6812591552734375, 0.7118148803710938, 0.74237060546875, 0.7729263305664062, 0.8034820556640625, 0.8340377807617188, 0.864593505859375, 0.8951492309570312, 0.9257049560546875, 0.9562606811523438, 0.98681640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 7.0, 6.0, 6.0, 10.0, 12.0, 14.0, 31.0, 30.0, 50.0, 53.0, 73.0, 63.0, 84.0, 88.0, 92.0, 77.0, 74.0, 48.0, 50.0, 27.0, 22.0, 17.0, 14.0, 12.0, 11.0, 6.0, 5.0, 7.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00011146068572998047, -0.00010842457413673401, -0.00010538846254348755, -0.00010235235095024109, -9.931623935699463e-05, -9.628012776374817e-05, -9.324401617050171e-05, -9.020790457725525e-05, -8.717179298400879e-05, -8.413568139076233e-05, -8.109956979751587e-05, -7.806345820426941e-05, -7.502734661102295e-05, -7.199123501777649e-05, -6.895512342453003e-05, -6.591901183128357e-05, -6.288290023803711e-05, -5.984678864479065e-05, -5.681067705154419e-05, -5.377456545829773e-05, -5.073845386505127e-05, -4.770234227180481e-05, -4.466623067855835e-05, -4.163011908531189e-05, -3.859400749206543e-05, -3.555789589881897e-05, -3.252178430557251e-05, -2.948567271232605e-05, -2.644956111907959e-05, -2.341344952583313e-05, -2.037733793258667e-05, -1.734122633934021e-05, -1.430511474609375e-05, -1.126900315284729e-05, -8.23289155960083e-06, -5.19677996635437e-06, -2.16066837310791e-06, 8.754432201385498e-07, 3.91155481338501e-06, 6.94766640663147e-06, 9.98377799987793e-06, 1.301988959312439e-05, 1.605600118637085e-05, 1.909211277961731e-05, 2.212822437286377e-05, 2.516433596611023e-05, 2.820044755935669e-05, 3.123655915260315e-05, 3.427267074584961e-05, 3.730878233909607e-05, 4.034489393234253e-05, 4.338100552558899e-05, 4.641711711883545e-05, 4.945322871208191e-05, 5.248934030532837e-05, 5.552545189857483e-05, 5.856156349182129e-05, 6.159767508506775e-05, 6.463378667831421e-05, 6.766989827156067e-05, 7.070600986480713e-05, 7.374212145805359e-05, 7.677823305130005e-05, 7.981434464454651e-05, 8.285045623779297e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 8.0, 7.0, 14.0, 15.0, 30.0, 38.0, 61.0, 134.0, 238.0, 570.0, 1886.0, 9262.0, 107892.0, 785562.0, 129213.0, 10449.0, 2011.0, 632.0, 257.0, 109.0, 72.0, 39.0, 24.0, 13.0, 8.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60595703125, -0.5749282836914062, -0.5438995361328125, -0.5128707885742188, -0.481842041015625, -0.45081329345703125, -0.4197845458984375, -0.38875579833984375, -0.35772705078125, -0.32669830322265625, -0.2956695556640625, -0.26464080810546875, -0.233612060546875, -0.20258331298828125, -0.1715545654296875, -0.14052581787109375, -0.1094970703125, -0.07846832275390625, -0.0474395751953125, -0.01641082763671875, 0.014617919921875, 0.04564666748046875, 0.0766754150390625, 0.10770416259765625, 0.13873291015625, 0.16976165771484375, 0.2007904052734375, 0.23181915283203125, 0.262847900390625, 0.29387664794921875, 0.3249053955078125, 0.35593414306640625, 0.386962890625, 0.41799163818359375, 0.4490203857421875, 0.48004913330078125, 0.511077880859375, 0.5421066284179688, 0.5731353759765625, 0.6041641235351562, 0.63519287109375, 0.6662216186523438, 0.6972503662109375, 0.7282791137695312, 0.759307861328125, 0.7903366088867188, 0.8213653564453125, 0.8523941040039062, 0.8834228515625, 0.9144515991210938, 0.9454803466796875, 0.9765090942382812, 1.007537841796875, 1.0385665893554688, 1.0695953369140625, 1.1006240844726562, 1.13165283203125, 1.1626815795898438, 1.1937103271484375, 1.2247390747070312, 1.255767822265625, 1.2867965698242188, 1.3178253173828125, 1.3488540649414062, 1.3798828125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 5.0, 10.0, 14.0, 19.0, 16.0, 23.0, 24.0, 53.0, 45.0, 59.0, 90.0, 70.0, 87.0, 82.0, 65.0, 64.0, 61.0, 50.0, 52.0, 28.0, 18.0, 11.0, 15.0, 9.0, 8.0, 4.0, 6.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342529296875, -0.32982635498046875, -0.3171234130859375, -0.30442047119140625, -0.291717529296875, -0.27901458740234375, -0.2663116455078125, -0.25360870361328125, -0.24090576171875, -0.22820281982421875, -0.2154998779296875, -0.20279693603515625, -0.190093994140625, -0.17739105224609375, -0.1646881103515625, -0.15198516845703125, -0.1392822265625, -0.12657928466796875, -0.1138763427734375, -0.10117340087890625, -0.088470458984375, -0.07576751708984375, -0.0630645751953125, -0.05036163330078125, -0.03765869140625, -0.02495574951171875, -0.0122528076171875, 0.00045013427734375, 0.013153076171875, 0.02585601806640625, 0.0385589599609375, 0.05126190185546875, 0.06396484375, 0.07666778564453125, 0.0893707275390625, 0.10207366943359375, 0.114776611328125, 0.12747955322265625, 0.1401824951171875, 0.15288543701171875, 0.16558837890625, 0.17829132080078125, 0.1909942626953125, 0.20369720458984375, 0.216400146484375, 0.22910308837890625, 0.2418060302734375, 0.25450897216796875, 0.2672119140625, 0.27991485595703125, 0.2926177978515625, 0.30532073974609375, 0.318023681640625, 0.33072662353515625, 0.3434295654296875, 0.35613250732421875, 0.36883544921875, 0.38153839111328125, 0.3942413330078125, 0.40694427490234375, 0.419647216796875, 0.43235015869140625, 0.4450531005859375, 0.45775604248046875, 0.470458984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 13.0, 36.0, 168.0, 315.0, 288.0, 115.0, 39.0, 10.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.353282928466797, -16.82286262512207, -16.29244041442871, -15.762019157409668, -15.231597900390625, -14.701176643371582, -14.170755386352539, -13.640335083007812, -13.109912872314453, -12.57949161529541, -12.049070358276367, -11.518649101257324, -10.988227844238281, -10.457806587219238, -9.927385330200195, -9.396965026855469, -8.866543769836426, -8.336122512817383, -7.80570125579834, -7.275279998779297, -6.744858741760254, -6.214437484741211, -5.684016704559326, -5.153595447540283, -4.62317419052124, -4.092752933502197, -3.5623316764831543, -3.0319106578826904, -2.5014894008636475, -1.9710681438446045, -1.4406471252441406, -0.9102258682250977, -0.3798046112060547, 0.1506165862083435, 0.6810377836227417, 1.2114589214324951, 1.741880178451538, 2.272301435470581, 2.802722454071045, 3.333143711090088, 3.863564968109131, 4.393986225128174, 4.924407482147217, 5.454828262329102, 5.9852495193481445, 6.5156707763671875, 7.0460920333862305, 7.576513290405273, 8.106934547424316, 8.63735580444336, 9.167777061462402, 9.698198318481445, 10.228619575500488, 10.759040832519531, 11.289461135864258, 11.819883346557617, 12.350303649902344, 12.880724906921387, 13.41114616394043, 13.941567420959473, 14.471988677978516, 15.002409934997559, 15.532831192016602, 16.063251495361328, 16.593673706054688]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 9.0, 8.0, 10.0, 19.0, 15.0, 19.0, 22.0, 27.0, 36.0, 35.0, 43.0, 42.0, 44.0, 42.0, 59.0, 49.0, 39.0, 43.0, 48.0, 54.0, 54.0, 45.0, 31.0, 35.0, 20.0, 27.0, 15.0, 21.0, 17.0, 13.0, 14.0, 10.0, 6.0, 3.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.109270095825195, -4.95625114440918, -4.803232192993164, -4.650213241577148, -4.497194290161133, -4.344175338745117, -4.191156387329102, -4.038137435913086, -3.8851184844970703, -3.7320995330810547, -3.579080581665039, -3.4260616302490234, -3.273042678833008, -3.120023727416992, -2.9670047760009766, -2.813985824584961, -2.6609668731689453, -2.5079479217529297, -2.354928970336914, -2.2019100189208984, -2.048891067504883, -1.8958721160888672, -1.7428531646728516, -1.589834213256836, -1.4368152618408203, -1.2837963104248047, -1.130777359008789, -0.9777584075927734, -0.8247394561767578, -0.6717205047607422, -0.5187015533447266, -0.36568260192871094, -0.2126631736755371, -0.059644222259521484, 0.09337472915649414, 0.24639368057250977, 0.3994126319885254, 0.552431583404541, 0.7054505348205566, 0.8584694862365723, 1.011488437652588, 1.1645073890686035, 1.3175263404846191, 1.4705452919006348, 1.6235642433166504, 1.776583194732666, 1.9296021461486816, 2.0826210975646973, 2.235640048980713, 2.3886590003967285, 2.541677951812744, 2.6946969032287598, 2.8477158546447754, 3.000734806060791, 3.1537537574768066, 3.3067727088928223, 3.459791660308838, 3.6128106117248535, 3.765829563140869, 3.9188485145568848, 4.0718674659729, 4.224886417388916, 4.377905368804932, 4.530924320220947, 4.683943271636963]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 6.0, 10.0, 5.0, 8.0, 6.0, 13.0, 15.0, 19.0, 29.0, 36.0, 26.0, 49.0, 57.0, 79.0, 121.0, 172.0, 274.0, 452.0, 857.0, 1950.0, 4645.0, 12776.0, 53479.0, 3325528.0, 737903.0, 37828.0, 10382.0, 3959.0, 1663.0, 816.0, 439.0, 244.0, 163.0, 81.0, 63.0, 42.0, 25.0, 21.0, 10.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.779296875, -2.7129669189453125, -2.646636962890625, -2.5803070068359375, -2.51397705078125, -2.4476470947265625, -2.381317138671875, -2.3149871826171875, -2.2486572265625, -2.1823272705078125, -2.115997314453125, -2.0496673583984375, -1.98333740234375, -1.9170074462890625, -1.850677490234375, -1.7843475341796875, -1.718017578125, -1.6516876220703125, -1.585357666015625, -1.5190277099609375, -1.45269775390625, -1.3863677978515625, -1.320037841796875, -1.2537078857421875, -1.1873779296875, -1.1210479736328125, -1.054718017578125, -0.9883880615234375, -0.92205810546875, -0.8557281494140625, -0.789398193359375, -0.7230682373046875, -0.65673828125, -0.5904083251953125, -0.524078369140625, -0.4577484130859375, -0.39141845703125, -0.3250885009765625, -0.258758544921875, -0.1924285888671875, -0.1260986328125, -0.0597686767578125, 0.006561279296875, 0.0728912353515625, 0.13922119140625, 0.2055511474609375, 0.271881103515625, 0.3382110595703125, 0.404541015625, 0.4708709716796875, 0.537200927734375, 0.6035308837890625, 0.66986083984375, 0.7361907958984375, 0.802520751953125, 0.8688507080078125, 0.9351806640625, 1.0015106201171875, 1.067840576171875, 1.1341705322265625, 1.20050048828125, 1.2668304443359375, 1.333160400390625, 1.3994903564453125, 1.4658203125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 4.0, 9.0, 14.0, 15.0, 29.0, 38.0, 36.0, 39.0, 65.0, 64.0, 69.0, 71.0, 90.0, 81.0, 73.0, 53.0, 45.0, 50.0, 43.0, 35.0, 18.0, 13.0, 18.0, 9.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.3876953125, -0.377593994140625, -0.36749267578125, -0.357391357421875, -0.3472900390625, -0.337188720703125, -0.32708740234375, -0.316986083984375, -0.306884765625, -0.296783447265625, -0.28668212890625, -0.276580810546875, -0.2664794921875, -0.256378173828125, -0.24627685546875, -0.236175537109375, -0.22607421875, -0.215972900390625, -0.20587158203125, -0.195770263671875, -0.1856689453125, -0.175567626953125, -0.16546630859375, -0.155364990234375, -0.145263671875, -0.135162353515625, -0.12506103515625, -0.114959716796875, -0.1048583984375, -0.094757080078125, -0.08465576171875, -0.074554443359375, -0.064453125, -0.054351806640625, -0.04425048828125, -0.034149169921875, -0.0240478515625, -0.013946533203125, -0.00384521484375, 0.006256103515625, 0.016357421875, 0.026458740234375, 0.03656005859375, 0.046661376953125, 0.0567626953125, 0.066864013671875, 0.07696533203125, 0.087066650390625, 0.09716796875, 0.107269287109375, 0.11737060546875, 0.127471923828125, 0.1375732421875, 0.147674560546875, 0.15777587890625, 0.167877197265625, 0.177978515625, 0.188079833984375, 0.19818115234375, 0.208282470703125, 0.2183837890625, 0.228485107421875, 0.23858642578125, 0.248687744140625, 0.2587890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 10.0, 9.0, 10.0, 29.0, 42.0, 53.0, 97.0, 146.0, 261.0, 569.0, 1415.0, 4227.0, 17258.0, 161839.0, 3851704.0, 134432.0, 15570.0, 4133.0, 1331.0, 528.0, 274.0, 126.0, 74.0, 49.0, 35.0, 17.0, 13.0, 13.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.8515625, -2.782806396484375, -2.71405029296875, -2.645294189453125, -2.5765380859375, -2.507781982421875, -2.43902587890625, -2.370269775390625, -2.301513671875, -2.232757568359375, -2.16400146484375, -2.095245361328125, -2.0264892578125, -1.957733154296875, -1.88897705078125, -1.820220947265625, -1.75146484375, -1.682708740234375, -1.61395263671875, -1.545196533203125, -1.4764404296875, -1.407684326171875, -1.33892822265625, -1.270172119140625, -1.201416015625, -1.132659912109375, -1.06390380859375, -0.995147705078125, -0.9263916015625, -0.857635498046875, -0.78887939453125, -0.720123291015625, -0.6513671875, -0.582611083984375, -0.51385498046875, -0.445098876953125, -0.3763427734375, -0.307586669921875, -0.23883056640625, -0.170074462890625, -0.101318359375, -0.032562255859375, 0.03619384765625, 0.104949951171875, 0.1737060546875, 0.242462158203125, 0.31121826171875, 0.379974365234375, 0.44873046875, 0.517486572265625, 0.58624267578125, 0.654998779296875, 0.7237548828125, 0.792510986328125, 0.86126708984375, 0.930023193359375, 0.998779296875, 1.067535400390625, 1.13629150390625, 1.205047607421875, 1.2738037109375, 1.342559814453125, 1.41131591796875, 1.480072021484375, 1.548828125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 12.0, 9.0, 11.0, 12.0, 15.0, 21.0, 39.0, 61.0, 92.0, 157.0, 335.0, 939.0, 1501.0, 441.0, 171.0, 101.0, 54.0, 30.0, 16.0, 9.0, 15.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.73681640625, -0.7169952392578125, -0.697174072265625, -0.6773529052734375, -0.65753173828125, -0.6377105712890625, -0.617889404296875, -0.5980682373046875, -0.5782470703125, -0.5584259033203125, -0.538604736328125, -0.5187835693359375, -0.49896240234375, -0.4791412353515625, -0.459320068359375, -0.4394989013671875, -0.419677734375, -0.3998565673828125, -0.380035400390625, -0.3602142333984375, -0.34039306640625, -0.3205718994140625, -0.300750732421875, -0.2809295654296875, -0.2611083984375, -0.2412872314453125, -0.221466064453125, -0.2016448974609375, -0.18182373046875, -0.1620025634765625, -0.142181396484375, -0.1223602294921875, -0.1025390625, -0.0827178955078125, -0.062896728515625, -0.0430755615234375, -0.02325439453125, -0.0034332275390625, 0.016387939453125, 0.0362091064453125, 0.0560302734375, 0.0758514404296875, 0.095672607421875, 0.1154937744140625, 0.13531494140625, 0.1551361083984375, 0.174957275390625, 0.1947784423828125, 0.214599609375, 0.2344207763671875, 0.254241943359375, 0.2740631103515625, 0.29388427734375, 0.3137054443359375, 0.333526611328125, 0.3533477783203125, 0.3731689453125, 0.3929901123046875, 0.412811279296875, 0.4326324462890625, 0.45245361328125, 0.4722747802734375, 0.492095947265625, 0.5119171142578125, 0.53173828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 6.0, 16.0, 36.0, 62.0, 96.0, 186.0, 221.0, 162.0, 122.0, 45.0, 19.0, 7.0, 8.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.845273971557617, -5.666065692901611, -5.486856937408447, -5.307648658752441, -5.1284403800964355, -4.94923210144043, -4.770023345947266, -4.59081506729126, -4.411606788635254, -4.232398509979248, -4.053189754486084, -3.873981475830078, -3.6947731971740723, -3.5155646800994873, -3.3363561630249023, -3.1571478843688965, -2.9779391288757324, -2.7987306118011475, -2.6195223331451416, -2.4403138160705566, -2.261105537414551, -2.081897020339966, -1.9026885032653809, -1.7234801054000854, -1.54427170753479, -1.3650633096694946, -1.1858549118041992, -1.0066463947296143, -0.8274379968643188, -0.6482295989990234, -0.4690210819244385, -0.28981268405914307, -0.11060380935668945, 0.06860461831092834, 0.24781304597854614, 0.42702150344848633, 0.6062299013137817, 0.7854382991790771, 0.9646468162536621, 1.1438552141189575, 1.323063611984253, 1.5022720098495483, 1.6814804077148438, 1.8606889247894287, 2.0398974418640137, 2.2191057205200195, 2.3983142375946045, 2.5775227546691895, 2.7567310333251953, 2.9359395503997803, 3.115147829055786, 3.294356346130371, 3.473564624786377, 3.652773141860962, 3.831981658935547, 4.011189937591553, 4.190398216247559, 4.3696064949035645, 4.5488152503967285, 4.728023529052734, 4.90723180770874, 5.086440086364746, 5.26564884185791, 5.444857120513916, 5.62406587600708]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 3.0, 0.0, 2.0, 3.0, 13.0, 6.0, 12.0, 17.0, 21.0, 24.0, 40.0, 45.0, 49.0, 46.0, 66.0, 53.0, 62.0, 59.0, 57.0, 68.0, 76.0, 57.0, 42.0, 49.0, 43.0, 27.0, 19.0, 14.0, 13.0, 9.0, 2.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.837348222732544, -1.7499698400497437, -1.6625914573669434, -1.5752129554748535, -1.4878345727920532, -1.400456190109253, -1.3130778074264526, -1.2256994247436523, -1.1383209228515625, -1.0509425401687622, -0.9635640978813171, -0.8761857151985168, -0.7888072729110718, -0.7014288902282715, -0.6140505075454712, -0.5266720652580261, -0.4392937421798706, -0.3519153296947479, -0.26453691720962524, -0.17715853452682495, -0.08978012204170227, -0.00240170955657959, 0.0849766731262207, 0.17235511541366577, 0.25973349809646606, 0.34711191058158875, 0.4344903230667114, 0.5218687057495117, 0.609247088432312, 0.6966255307197571, 0.7840039134025574, 0.8713823556900024, 0.9587607383728027, 1.046139121055603, 1.1335175037384033, 1.2208960056304932, 1.3082743883132935, 1.3956527709960938, 1.483031153678894, 1.5704095363616943, 1.6577880382537842, 1.7451664209365845, 1.8325448036193848, 1.9199233055114746, 2.0073015689849854, 2.094680070877075, 2.182058334350586, 2.269436836242676, 2.3568153381347656, 2.4441938400268555, 2.531572103500366, 2.618950605392456, 2.706328868865967, 2.7937073707580566, 2.8810858726501465, 2.9684641361236572, 3.055842399597168, 3.143220901489258, 3.2305991649627686, 3.3179776668548584, 3.405355930328369, 3.492734432220459, 3.580112934112549, 3.6674911975860596, 3.7548696994781494]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 6.0, 7.0, 8.0, 16.0, 23.0, 35.0, 48.0, 66.0, 141.0, 323.0, 697.0, 1792.0, 6236.0, 33286.0, 455555.0, 503910.0, 36421.0, 6647.0, 1953.0, 682.0, 285.0, 157.0, 84.0, 60.0, 32.0, 28.0, 15.0, 10.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.90234375, -2.823944091796875, -2.74554443359375, -2.667144775390625, -2.5887451171875, -2.510345458984375, -2.43194580078125, -2.353546142578125, -2.275146484375, -2.196746826171875, -2.11834716796875, -2.039947509765625, -1.9615478515625, -1.883148193359375, -1.80474853515625, -1.726348876953125, -1.64794921875, -1.569549560546875, -1.49114990234375, -1.412750244140625, -1.3343505859375, -1.255950927734375, -1.17755126953125, -1.099151611328125, -1.020751953125, -0.942352294921875, -0.86395263671875, -0.785552978515625, -0.7071533203125, -0.628753662109375, -0.55035400390625, -0.471954345703125, -0.3935546875, -0.315155029296875, -0.23675537109375, -0.158355712890625, -0.0799560546875, -0.001556396484375, 0.07684326171875, 0.155242919921875, 0.233642578125, 0.312042236328125, 0.39044189453125, 0.468841552734375, 0.5472412109375, 0.625640869140625, 0.70404052734375, 0.782440185546875, 0.86083984375, 0.939239501953125, 1.01763916015625, 1.096038818359375, 1.1744384765625, 1.252838134765625, 1.33123779296875, 1.409637451171875, 1.488037109375, 1.566436767578125, 1.64483642578125, 1.723236083984375, 1.8016357421875, 1.880035400390625, 1.95843505859375, 2.036834716796875, 2.115234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 11.0, 11.0, 13.0, 13.0, 25.0, 43.0, 45.0, 46.0, 49.0, 71.0, 55.0, 82.0, 92.0, 74.0, 77.0, 60.0, 53.0, 44.0, 46.0, 22.0, 22.0, 14.0, 11.0, 12.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.412353515625, -0.4012794494628906, -0.39020538330078125, -0.3791313171386719, -0.3680572509765625, -0.3569831848144531, -0.34590911865234375, -0.3348350524902344, -0.323760986328125, -0.3126869201660156, -0.30161285400390625, -0.2905387878417969, -0.2794647216796875, -0.2683906555175781, -0.25731658935546875, -0.24624252319335938, -0.23516845703125, -0.22409439086914062, -0.21302032470703125, -0.20194625854492188, -0.1908721923828125, -0.17979812622070312, -0.16872406005859375, -0.15764999389648438, -0.146575927734375, -0.13550186157226562, -0.12442779541015625, -0.11335372924804688, -0.1022796630859375, -0.09120559692382812, -0.08013153076171875, -0.06905746459960938, -0.0579833984375, -0.046909332275390625, -0.03583526611328125, -0.024761199951171875, -0.0136871337890625, -0.002613067626953125, 0.00846099853515625, 0.019535064697265625, 0.030609130859375, 0.041683197021484375, 0.05275726318359375, 0.06383132934570312, 0.0749053955078125, 0.08597946166992188, 0.09705352783203125, 0.10812759399414062, 0.11920166015625, 0.13027572631835938, 0.14134979248046875, 0.15242385864257812, 0.1634979248046875, 0.17457199096679688, 0.18564605712890625, 0.19672012329101562, 0.207794189453125, 0.21886825561523438, 0.22994232177734375, 0.24101638793945312, 0.2520904541015625, 0.2631645202636719, 0.27423858642578125, 0.2853126525878906, 0.29638671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 6.0, 8.0, 11.0, 21.0, 31.0, 36.0, 52.0, 110.0, 186.0, 386.0, 948.0, 2782.0, 10089.0, 54059.0, 419163.0, 480419.0, 63717.0, 11435.0, 3022.0, 1041.0, 444.0, 212.0, 98.0, 57.0, 50.0, 28.0, 21.0, 14.0, 15.0, 14.0, 10.0, 10.0, 7.0, 11.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5634765625, -1.517547607421875, -1.47161865234375, -1.425689697265625, -1.3797607421875, -1.333831787109375, -1.28790283203125, -1.241973876953125, -1.196044921875, -1.150115966796875, -1.10418701171875, -1.058258056640625, -1.0123291015625, -0.966400146484375, -0.92047119140625, -0.874542236328125, -0.82861328125, -0.782684326171875, -0.73675537109375, -0.690826416015625, -0.6448974609375, -0.598968505859375, -0.55303955078125, -0.507110595703125, -0.461181640625, -0.415252685546875, -0.36932373046875, -0.323394775390625, -0.2774658203125, -0.231536865234375, -0.18560791015625, -0.139678955078125, -0.09375, -0.047821044921875, -0.00189208984375, 0.044036865234375, 0.0899658203125, 0.135894775390625, 0.18182373046875, 0.227752685546875, 0.273681640625, 0.319610595703125, 0.36553955078125, 0.411468505859375, 0.4573974609375, 0.503326416015625, 0.54925537109375, 0.595184326171875, 0.64111328125, 0.687042236328125, 0.73297119140625, 0.778900146484375, 0.8248291015625, 0.870758056640625, 0.91668701171875, 0.962615966796875, 1.008544921875, 1.054473876953125, 1.10040283203125, 1.146331787109375, 1.1922607421875, 1.238189697265625, 1.28411865234375, 1.330047607421875, 1.3759765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 3.0, 5.0, 11.0, 13.0, 15.0, 22.0, 28.0, 24.0, 27.0, 28.0, 30.0, 40.0, 54.0, 68.0, 48.0, 39.0, 70.0, 47.0, 74.0, 54.0, 48.0, 44.0, 38.0, 29.0, 20.0, 23.0, 16.0, 16.0, 15.0, 13.0, 5.0, 6.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.978515625, -0.9448089599609375, -0.911102294921875, -0.8773956298828125, -0.84368896484375, -0.8099822998046875, -0.776275634765625, -0.7425689697265625, -0.7088623046875, -0.6751556396484375, -0.641448974609375, -0.6077423095703125, -0.57403564453125, -0.5403289794921875, -0.506622314453125, -0.4729156494140625, -0.439208984375, -0.4055023193359375, -0.371795654296875, -0.3380889892578125, -0.30438232421875, -0.2706756591796875, -0.236968994140625, -0.2032623291015625, -0.1695556640625, -0.1358489990234375, -0.102142333984375, -0.0684356689453125, -0.03472900390625, -0.0010223388671875, 0.032684326171875, 0.0663909912109375, 0.10009765625, 0.1338043212890625, 0.167510986328125, 0.2012176513671875, 0.23492431640625, 0.2686309814453125, 0.302337646484375, 0.3360443115234375, 0.3697509765625, 0.4034576416015625, 0.437164306640625, 0.4708709716796875, 0.50457763671875, 0.5382843017578125, 0.571990966796875, 0.6056976318359375, 0.639404296875, 0.6731109619140625, 0.706817626953125, 0.7405242919921875, 0.77423095703125, 0.8079376220703125, 0.841644287109375, 0.8753509521484375, 0.9090576171875, 0.9427642822265625, 0.976470947265625, 1.0101776123046875, 1.04388427734375, 1.0775909423828125, 1.111297607421875, 1.1450042724609375, 1.1787109375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 7.0, 16.0, 44.0, 88.0, 209.0, 818.0, 17675.0, 1022860.0, 6027.0, 510.0, 158.0, 88.0, 28.0, 12.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.51171875, -3.3785400390625, -3.245361328125, -3.1121826171875, -2.97900390625, -2.8458251953125, -2.712646484375, -2.5794677734375, -2.4462890625, -2.3131103515625, -2.179931640625, -2.0467529296875, -1.91357421875, -1.7803955078125, -1.647216796875, -1.5140380859375, -1.380859375, -1.2476806640625, -1.114501953125, -0.9813232421875, -0.84814453125, -0.7149658203125, -0.581787109375, -0.4486083984375, -0.3154296875, -0.1822509765625, -0.049072265625, 0.0841064453125, 0.21728515625, 0.3504638671875, 0.483642578125, 0.6168212890625, 0.75, 0.8831787109375, 1.016357421875, 1.1495361328125, 1.28271484375, 1.4158935546875, 1.549072265625, 1.6822509765625, 1.8154296875, 1.9486083984375, 2.081787109375, 2.2149658203125, 2.34814453125, 2.4813232421875, 2.614501953125, 2.7476806640625, 2.880859375, 3.0140380859375, 3.147216796875, 3.2803955078125, 3.41357421875, 3.5467529296875, 3.679931640625, 3.8131103515625, 3.9462890625, 4.0794677734375, 4.212646484375, 4.3458251953125, 4.47900390625, 4.6121826171875, 4.745361328125, 4.8785400390625, 5.01171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 18.0, 22.0, 39.0, 72.0, 114.0, 167.0, 213.0, 135.0, 87.0, 42.0, 33.0, 22.0, 11.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002493858337402344, -0.00024287402629852295, -0.00023636221885681152, -0.0002298504114151001, -0.00022333860397338867, -0.00021682679653167725, -0.00021031498908996582, -0.0002038031816482544, -0.00019729137420654297, -0.00019077956676483154, -0.00018426775932312012, -0.0001777559518814087, -0.00017124414443969727, -0.00016473233699798584, -0.00015822052955627441, -0.000151708722114563, -0.00014519691467285156, -0.00013868510723114014, -0.0001321732997894287, -0.00012566149234771729, -0.00011914968490600586, -0.00011263787746429443, -0.00010612607002258301, -9.961426258087158e-05, -9.310245513916016e-05, -8.659064769744873e-05, -8.00788402557373e-05, -7.356703281402588e-05, -6.705522537231445e-05, -6.054341793060303e-05, -5.40316104888916e-05, -4.7519803047180176e-05, -4.100799560546875e-05, -3.4496188163757324e-05, -2.79843807220459e-05, -2.1472573280334473e-05, -1.4960765838623047e-05, -8.448958396911621e-06, -1.9371509552001953e-06, 4.5746564865112305e-06, 1.1086463928222656e-05, 1.7598271369934082e-05, 2.4110078811645508e-05, 3.0621886253356934e-05, 3.713369369506836e-05, 4.3645501136779785e-05, 5.015730857849121e-05, 5.666911602020264e-05, 6.318092346191406e-05, 6.969273090362549e-05, 7.620453834533691e-05, 8.271634578704834e-05, 8.922815322875977e-05, 9.573996067047119e-05, 0.00010225176811218262, 0.00010876357555389404, 0.00011527538299560547, 0.0001217871904373169, 0.00012829899787902832, 0.00013481080532073975, 0.00014132261276245117, 0.0001478344202041626, 0.00015434622764587402, 0.00016085803508758545, 0.00016736984252929688]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 20.0, 52.0, 80.0, 199.0, 621.0, 8565.0, 1030102.0, 7949.0, 623.0, 181.0, 69.0, 43.0, 24.0, 12.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.7421875, -4.6005859375, -4.458984375, -4.3173828125, -4.17578125, -4.0341796875, -3.892578125, -3.7509765625, -3.609375, -3.4677734375, -3.326171875, -3.1845703125, -3.04296875, -2.9013671875, -2.759765625, -2.6181640625, -2.4765625, -2.3349609375, -2.193359375, -2.0517578125, -1.91015625, -1.7685546875, -1.626953125, -1.4853515625, -1.34375, -1.2021484375, -1.060546875, -0.9189453125, -0.77734375, -0.6357421875, -0.494140625, -0.3525390625, -0.2109375, -0.0693359375, 0.072265625, 0.2138671875, 0.35546875, 0.4970703125, 0.638671875, 0.7802734375, 0.921875, 1.0634765625, 1.205078125, 1.3466796875, 1.48828125, 1.6298828125, 1.771484375, 1.9130859375, 2.0546875, 2.1962890625, 2.337890625, 2.4794921875, 2.62109375, 2.7626953125, 2.904296875, 3.0458984375, 3.1875, 3.3291015625, 3.470703125, 3.6123046875, 3.75390625, 3.8955078125, 4.037109375, 4.1787109375, 4.3203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 24.0, 96.0, 417.0, 339.0, 85.0, 26.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.513671875, -2.4324951171875, -2.351318359375, -2.2701416015625, -2.18896484375, -2.1077880859375, -2.026611328125, -1.9454345703125, -1.8642578125, -1.7830810546875, -1.701904296875, -1.6207275390625, -1.53955078125, -1.4583740234375, -1.377197265625, -1.2960205078125, -1.21484375, -1.1336669921875, -1.052490234375, -0.9713134765625, -0.89013671875, -0.8089599609375, -0.727783203125, -0.6466064453125, -0.5654296875, -0.4842529296875, -0.403076171875, -0.3218994140625, -0.24072265625, -0.1595458984375, -0.078369140625, 0.0028076171875, 0.083984375, 0.1651611328125, 0.246337890625, 0.3275146484375, 0.40869140625, 0.4898681640625, 0.571044921875, 0.6522216796875, 0.7333984375, 0.8145751953125, 0.895751953125, 0.9769287109375, 1.05810546875, 1.1392822265625, 1.220458984375, 1.3016357421875, 1.3828125, 1.4639892578125, 1.545166015625, 1.6263427734375, 1.70751953125, 1.7886962890625, 1.869873046875, 1.9510498046875, 2.0322265625, 2.1134033203125, 2.194580078125, 2.2757568359375, 2.35693359375, 2.4381103515625, 2.519287109375, 2.6004638671875, 2.681640625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 8.0, 26.0, 86.0, 277.0, 347.0, 171.0, 63.0, 17.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-37.4338264465332, -36.72834777832031, -36.02286911010742, -35.31739044189453, -34.61191177368164, -33.90643310546875, -33.200950622558594, -32.4954719543457, -31.789993286132812, -31.084514617919922, -30.37903594970703, -29.67355728149414, -28.968076705932617, -28.262598037719727, -27.557119369506836, -26.851640701293945, -26.146162033081055, -25.440683364868164, -24.735204696655273, -24.02972412109375, -23.32424545288086, -22.61876678466797, -21.913288116455078, -21.207809448242188, -20.502330780029297, -19.796852111816406, -19.091373443603516, -18.385894775390625, -17.6804141998291, -16.97493553161621, -16.26945686340332, -15.56397819519043, -14.858497619628906, -14.153018951416016, -13.447539329528809, -12.742060661315918, -12.036581039428711, -11.33110237121582, -10.62562370300293, -9.920145034790039, -9.214665412902832, -8.509186744689941, -7.803707122802734, -7.098228454589844, -6.392749309539795, -5.687270164489746, -4.9817914962768555, -4.276312351226807, -3.570833206176758, -2.865354061126709, -2.1598751544952393, -1.4543962478637695, -0.7489171028137207, -0.043437957763671875, 0.6620407104492188, 1.3675198554992676, 2.0729990005493164, 2.7784781455993652, 3.483957052230835, 4.189435958862305, 4.8949151039123535, 5.600394248962402, 6.305872917175293, 7.011352062225342, 7.716831207275391]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 3.0, 7.0, 6.0, 13.0, 17.0, 4.0, 13.0, 24.0, 17.0, 24.0, 27.0, 28.0, 30.0, 38.0, 43.0, 44.0, 50.0, 41.0, 38.0, 53.0, 36.0, 39.0, 44.0, 36.0, 36.0, 39.0, 34.0, 35.0, 27.0, 18.0, 18.0, 19.0, 16.0, 15.0, 7.0, 14.0, 11.0, 5.0, 6.0, 3.0, 3.0, 2.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.314615726470947, -5.158224582672119, -5.001832962036133, -4.845441818237305, -4.689050674438477, -4.532659530639648, -4.376267910003662, -4.219876766204834, -4.063485145568848, -3.9070937633514404, -3.7507026195526123, -3.594311237335205, -3.437920093536377, -3.2815287113189697, -3.1251373291015625, -2.9687461853027344, -2.8123550415039062, -2.655963659286499, -2.499572515487671, -2.3431811332702637, -2.1867899894714355, -2.0303986072540283, -1.874007225036621, -1.7176159620285034, -1.5612246990203857, -1.404833436012268, -1.2484421730041504, -1.0920507907867432, -0.9356595277786255, -0.7792682647705078, -0.6228769421577454, -0.4664856195449829, -0.31009387969970703, -0.15370258688926697, 0.0026887059211730957, 0.15907999873161316, 0.3154712915420532, 0.4718625545501709, 0.6282538771629333, 0.7846451997756958, 0.9410364627838135, 1.0974277257919312, 1.2538189888000488, 1.410210371017456, 1.5666016340255737, 1.7229928970336914, 1.8793842792510986, 2.035775661468506, 2.192166805267334, 2.348558187484741, 2.5049493312835693, 2.6613407135009766, 2.8177318572998047, 2.974123239517212, 3.130514621734619, 3.2869057655334473, 3.4432971477508545, 3.5996885299682617, 3.75607967376709, 3.912471055984497, 4.068862438201904, 4.225253582000732, 4.3816447257995605, 4.538036346435547, 4.694427490234375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 8.0, 11.0, 14.0, 18.0, 21.0, 35.0, 56.0, 74.0, 137.0, 215.0, 485.0, 1201.0, 3802.0, 16340.0, 201843.0, 3913791.0, 44584.0, 7808.0, 2276.0, 829.0, 335.0, 177.0, 88.0, 51.0, 31.0, 19.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.642578125, -3.554290771484375, -3.46600341796875, -3.377716064453125, -3.2894287109375, -3.201141357421875, -3.11285400390625, -3.024566650390625, -2.936279296875, -2.847991943359375, -2.75970458984375, -2.671417236328125, -2.5831298828125, -2.494842529296875, -2.40655517578125, -2.318267822265625, -2.22998046875, -2.141693115234375, -2.05340576171875, -1.965118408203125, -1.8768310546875, -1.788543701171875, -1.70025634765625, -1.611968994140625, -1.523681640625, -1.435394287109375, -1.34710693359375, -1.258819580078125, -1.1705322265625, -1.082244873046875, -0.99395751953125, -0.905670166015625, -0.8173828125, -0.729095458984375, -0.64080810546875, -0.552520751953125, -0.4642333984375, -0.375946044921875, -0.28765869140625, -0.199371337890625, -0.111083984375, -0.022796630859375, 0.06549072265625, 0.153778076171875, 0.2420654296875, 0.330352783203125, 0.41864013671875, 0.506927490234375, 0.59521484375, 0.683502197265625, 0.77178955078125, 0.860076904296875, 0.9483642578125, 1.036651611328125, 1.12493896484375, 1.213226318359375, 1.301513671875, 1.389801025390625, 1.47808837890625, 1.566375732421875, 1.6546630859375, 1.742950439453125, 1.83123779296875, 1.919525146484375, 2.0078125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 5.0, 13.0, 17.0, 21.0, 20.0, 21.0, 33.0, 42.0, 50.0, 67.0, 65.0, 57.0, 62.0, 68.0, 62.0, 70.0, 60.0, 61.0, 52.0, 30.0, 28.0, 29.0, 25.0, 11.0, 13.0, 8.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.440673828125, -0.42914581298828125, -0.4176177978515625, -0.40608978271484375, -0.394561767578125, -0.38303375244140625, -0.3715057373046875, -0.35997772216796875, -0.34844970703125, -0.33692169189453125, -0.3253936767578125, -0.31386566162109375, -0.302337646484375, -0.29080963134765625, -0.2792816162109375, -0.26775360107421875, -0.2562255859375, -0.24469757080078125, -0.2331695556640625, -0.22164154052734375, -0.210113525390625, -0.19858551025390625, -0.1870574951171875, -0.17552947998046875, -0.16400146484375, -0.15247344970703125, -0.1409454345703125, -0.12941741943359375, -0.117889404296875, -0.10636138916015625, -0.0948333740234375, -0.08330535888671875, -0.07177734375, -0.06024932861328125, -0.0487213134765625, -0.03719329833984375, -0.025665283203125, -0.01413726806640625, -0.0026092529296875, 0.00891876220703125, 0.02044677734375, 0.03197479248046875, 0.0435028076171875, 0.05503082275390625, 0.066558837890625, 0.07808685302734375, 0.0896148681640625, 0.10114288330078125, 0.1126708984375, 0.12419891357421875, 0.1357269287109375, 0.14725494384765625, 0.158782958984375, 0.17031097412109375, 0.1818389892578125, 0.19336700439453125, 0.20489501953125, 0.21642303466796875, 0.2279510498046875, 0.23947906494140625, 0.251007080078125, 0.26253509521484375, 0.2740631103515625, 0.28559112548828125, 0.297119140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 0.0, 11.0, 11.0, 11.0, 19.0, 44.0, 62.0, 82.0, 107.0, 152.0, 256.0, 636.0, 2453.0, 26626.0, 4112781.0, 46305.0, 3125.0, 748.0, 299.0, 165.0, 120.0, 84.0, 71.0, 44.0, 23.0, 25.0, 13.0, 10.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69921875, -5.52423095703125, -5.3492431640625, -5.17425537109375, -4.999267578125, -4.82427978515625, -4.6492919921875, -4.47430419921875, -4.29931640625, -4.12432861328125, -3.9493408203125, -3.77435302734375, -3.599365234375, -3.42437744140625, -3.2493896484375, -3.07440185546875, -2.8994140625, -2.72442626953125, -2.5494384765625, -2.37445068359375, -2.199462890625, -2.02447509765625, -1.8494873046875, -1.67449951171875, -1.49951171875, -1.32452392578125, -1.1495361328125, -0.97454833984375, -0.799560546875, -0.62457275390625, -0.4495849609375, -0.27459716796875, -0.099609375, 0.07537841796875, 0.2503662109375, 0.42535400390625, 0.600341796875, 0.77532958984375, 0.9503173828125, 1.12530517578125, 1.30029296875, 1.47528076171875, 1.6502685546875, 1.82525634765625, 2.000244140625, 2.17523193359375, 2.3502197265625, 2.52520751953125, 2.7001953125, 2.87518310546875, 3.0501708984375, 3.22515869140625, 3.400146484375, 3.57513427734375, 3.7501220703125, 3.92510986328125, 4.10009765625, 4.27508544921875, 4.4500732421875, 4.62506103515625, 4.800048828125, 4.97503662109375, 5.1500244140625, 5.32501220703125, 5.5]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 14.0, 38.0, 130.0, 2249.0, 1502.0, 91.0, 32.0, 13.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.930389404296875, -1.85882568359375, -1.787261962890625, -1.7156982421875, -1.644134521484375, -1.57257080078125, -1.501007080078125, -1.429443359375, -1.357879638671875, -1.28631591796875, -1.214752197265625, -1.1431884765625, -1.071624755859375, -1.00006103515625, -0.928497314453125, -0.85693359375, -0.785369873046875, -0.71380615234375, -0.642242431640625, -0.5706787109375, -0.499114990234375, -0.42755126953125, -0.355987548828125, -0.284423828125, -0.212860107421875, -0.14129638671875, -0.069732666015625, 0.0018310546875, 0.073394775390625, 0.14495849609375, 0.216522216796875, 0.2880859375, 0.359649658203125, 0.43121337890625, 0.502777099609375, 0.5743408203125, 0.645904541015625, 0.71746826171875, 0.789031982421875, 0.860595703125, 0.932159423828125, 1.00372314453125, 1.075286865234375, 1.1468505859375, 1.218414306640625, 1.28997802734375, 1.361541748046875, 1.43310546875, 1.504669189453125, 1.57623291015625, 1.647796630859375, 1.7193603515625, 1.790924072265625, 1.86248779296875, 1.934051513671875, 2.005615234375, 2.077178955078125, 2.14874267578125, 2.220306396484375, 2.2918701171875, 2.363433837890625, 2.43499755859375, 2.506561279296875, 2.578125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 6.0, 15.0, 22.0, 49.0, 141.0, 279.0, 247.0, 123.0, 66.0, 29.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.467264175415039, -6.251947402954102, -6.036631107330322, -5.821314334869385, -5.6059980392456055, -5.390681266784668, -5.175364971160889, -4.960048198699951, -4.744731903076172, -4.529415130615234, -4.314098834991455, -4.098782062530518, -3.8834657669067383, -3.668148994445801, -3.4528326988220215, -3.237515926361084, -3.0221993923187256, -2.806882858276367, -2.591566324234009, -2.3762497901916504, -2.160933256149292, -1.945616602897644, -1.7303000688552856, -1.5149835348129272, -1.2996670007705688, -1.0843504667282104, -0.869033932685852, -0.6537173390388489, -0.4384008049964905, -0.2230842113494873, -0.007767677307128906, 0.2075488567352295, 0.4228653907775879, 0.6381819248199463, 0.8534984588623047, 1.068814992904663, 1.2841315269470215, 1.4994481801986694, 1.7147647142410278, 1.9300812482833862, 2.145397663116455, 2.3607141971588135, 2.576030731201172, 2.7913472652435303, 3.0066637992858887, 3.221980571746826, 3.4372968673706055, 3.652613639831543, 3.8679301738739014, 4.08324670791626, 4.298563480377197, 4.513879776000977, 4.729196548461914, 4.944512844085693, 5.159829616546631, 5.37514591217041, 5.590462684631348, 5.805779457092285, 6.0210957527160645, 6.236412525177002, 6.451728820800781, 6.667045593261719, 6.882361888885498, 7.0976786613464355, 7.312994956970215]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 21.0, 33.0, 62.0, 83.0, 103.0, 117.0, 118.0, 126.0, 103.0, 77.0, 50.0, 27.0, 31.0, 21.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5036702156066895, -5.349239349365234, -5.194808006286621, -5.040376663208008, -4.885945796966553, -4.731514930725098, -4.577083587646484, -4.422652244567871, -4.268221378326416, -4.113790512084961, -3.9593591690063477, -3.8049280643463135, -3.6504969596862793, -3.496065855026245, -3.341634750366211, -3.1872036457061768, -3.0327725410461426, -2.8783414363861084, -2.723910331726074, -2.56947922706604, -2.415048122406006, -2.2606170177459717, -2.1061859130859375, -1.9517548084259033, -1.7973237037658691, -1.642892599105835, -1.4884614944458008, -1.3340303897857666, -1.1795992851257324, -1.0251681804656982, -0.8707370758056641, -0.7163059711456299, -0.5618753433227539, -0.4074442386627197, -0.25301313400268555, -0.09858202934265137, 0.05584907531738281, 0.210280179977417, 0.36471128463745117, 0.5191423892974854, 0.6735734939575195, 0.8280045986175537, 0.9824357032775879, 1.136866807937622, 1.2912979125976562, 1.4457290172576904, 1.6001601219177246, 1.7545912265777588, 1.909022331237793, 2.063453435897827, 2.2178845405578613, 2.3723156452178955, 2.5267467498779297, 2.681177854537964, 2.835608959197998, 2.9900400638580322, 3.1444711685180664, 3.2989022731781006, 3.4533333778381348, 3.607764482498169, 3.762195587158203, 3.9166266918182373, 4.0710577964782715, 4.225488662719727, 4.37992000579834]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 1.0, 10.0, 18.0, 27.0, 32.0, 68.0, 144.0, 266.0, 818.0, 3570.0, 35419.0, 774144.0, 220485.0, 10932.0, 1678.0, 497.0, 188.0, 105.0, 56.0, 29.0, 22.0, 15.0, 7.0, 9.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.5703125, -4.460906982421875, -4.35150146484375, -4.242095947265625, -4.1326904296875, -4.023284912109375, -3.91387939453125, -3.804473876953125, -3.695068359375, -3.585662841796875, -3.47625732421875, -3.366851806640625, -3.2574462890625, -3.148040771484375, -3.03863525390625, -2.929229736328125, -2.81982421875, -2.710418701171875, -2.60101318359375, -2.491607666015625, -2.3822021484375, -2.272796630859375, -2.16339111328125, -2.053985595703125, -1.944580078125, -1.835174560546875, -1.72576904296875, -1.616363525390625, -1.5069580078125, -1.397552490234375, -1.28814697265625, -1.178741455078125, -1.0693359375, -0.959930419921875, -0.85052490234375, -0.741119384765625, -0.6317138671875, -0.522308349609375, -0.41290283203125, -0.303497314453125, -0.194091796875, -0.084686279296875, 0.02471923828125, 0.134124755859375, 0.2435302734375, 0.352935791015625, 0.46234130859375, 0.571746826171875, 0.68115234375, 0.790557861328125, 0.89996337890625, 1.009368896484375, 1.1187744140625, 1.228179931640625, 1.33758544921875, 1.446990966796875, 1.556396484375, 1.665802001953125, 1.77520751953125, 1.884613037109375, 1.9940185546875, 2.103424072265625, 2.21282958984375, 2.322235107421875, 2.431640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 11.0, 20.0, 18.0, 21.0, 41.0, 58.0, 69.0, 77.0, 82.0, 85.0, 85.0, 74.0, 75.0, 63.0, 63.0, 31.0, 34.0, 25.0, 23.0, 17.0, 8.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.59326171875, -0.5784912109375, -0.563720703125, -0.5489501953125, -0.5341796875, -0.5194091796875, -0.504638671875, -0.4898681640625, -0.47509765625, -0.4603271484375, -0.445556640625, -0.4307861328125, -0.416015625, -0.4012451171875, -0.386474609375, -0.3717041015625, -0.35693359375, -0.3421630859375, -0.327392578125, -0.3126220703125, -0.2978515625, -0.2830810546875, -0.268310546875, -0.2535400390625, -0.23876953125, -0.2239990234375, -0.209228515625, -0.1944580078125, -0.1796875, -0.1649169921875, -0.150146484375, -0.1353759765625, -0.12060546875, -0.1058349609375, -0.091064453125, -0.0762939453125, -0.0615234375, -0.0467529296875, -0.031982421875, -0.0172119140625, -0.00244140625, 0.0123291015625, 0.027099609375, 0.0418701171875, 0.056640625, 0.0714111328125, 0.086181640625, 0.1009521484375, 0.11572265625, 0.1304931640625, 0.145263671875, 0.1600341796875, 0.1748046875, 0.1895751953125, 0.204345703125, 0.2191162109375, 0.23388671875, 0.2486572265625, 0.263427734375, 0.2781982421875, 0.29296875, 0.3077392578125, 0.322509765625, 0.3372802734375, 0.35205078125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 5.0, 10.0, 17.0, 17.0, 9.0, 30.0, 29.0, 53.0, 73.0, 144.0, 259.0, 722.0, 2454.0, 10843.0, 66950.0, 488243.0, 411068.0, 55003.0, 9162.0, 2194.0, 653.0, 254.0, 120.0, 76.0, 46.0, 29.0, 18.0, 12.0, 10.0, 12.0, 10.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.31927490234375, -1.2684326171875, -1.21759033203125, -1.166748046875, -1.11590576171875, -1.0650634765625, -1.01422119140625, -0.96337890625, -0.91253662109375, -0.8616943359375, -0.81085205078125, -0.760009765625, -0.70916748046875, -0.6583251953125, -0.60748291015625, -0.556640625, -0.50579833984375, -0.4549560546875, -0.40411376953125, -0.353271484375, -0.30242919921875, -0.2515869140625, -0.20074462890625, -0.14990234375, -0.09906005859375, -0.0482177734375, 0.00262451171875, 0.053466796875, 0.10430908203125, 0.1551513671875, 0.20599365234375, 0.2568359375, 0.30767822265625, 0.3585205078125, 0.40936279296875, 0.460205078125, 0.51104736328125, 0.5618896484375, 0.61273193359375, 0.66357421875, 0.71441650390625, 0.7652587890625, 0.81610107421875, 0.866943359375, 0.91778564453125, 0.9686279296875, 1.01947021484375, 1.0703125, 1.12115478515625, 1.1719970703125, 1.22283935546875, 1.273681640625, 1.32452392578125, 1.3753662109375, 1.42620849609375, 1.47705078125, 1.52789306640625, 1.5787353515625, 1.62957763671875, 1.680419921875, 1.73126220703125, 1.7821044921875, 1.83294677734375, 1.8837890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 8.0, 10.0, 11.0, 8.0, 20.0, 19.0, 25.0, 30.0, 30.0, 32.0, 44.0, 35.0, 34.0, 53.0, 39.0, 47.0, 44.0, 59.0, 41.0, 49.0, 35.0, 37.0, 38.0, 38.0, 29.0, 21.0, 32.0, 23.0, 17.0, 22.0, 6.0, 16.0, 10.0, 7.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93408203125, -0.9002914428710938, -0.8665008544921875, -0.8327102661132812, -0.798919677734375, -0.7651290893554688, -0.7313385009765625, -0.6975479125976562, -0.66375732421875, -0.6299667358398438, -0.5961761474609375, -0.5623855590820312, -0.528594970703125, -0.49480438232421875, -0.4610137939453125, -0.42722320556640625, -0.3934326171875, -0.35964202880859375, -0.3258514404296875, -0.29206085205078125, -0.258270263671875, -0.22447967529296875, -0.1906890869140625, -0.15689849853515625, -0.12310791015625, -0.08931732177734375, -0.0555267333984375, -0.02173614501953125, 0.012054443359375, 0.04584503173828125, 0.0796356201171875, 0.11342620849609375, 0.147216796875, 0.18100738525390625, 0.2147979736328125, 0.24858856201171875, 0.282379150390625, 0.31616973876953125, 0.3499603271484375, 0.38375091552734375, 0.41754150390625, 0.45133209228515625, 0.4851226806640625, 0.5189132690429688, 0.552703857421875, 0.5864944458007812, 0.6202850341796875, 0.6540756225585938, 0.6878662109375, 0.7216567993164062, 0.7554473876953125, 0.7892379760742188, 0.823028564453125, 0.8568191528320312, 0.8906097412109375, 0.9244003295898438, 0.95819091796875, 0.9919815063476562, 1.0257720947265625, 1.0595626831054688, 1.093353271484375, 1.1271438598632812, 1.1609344482421875, 1.1947250366210938, 1.228515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 9.0, 12.0, 12.0, 23.0, 27.0, 45.0, 79.0, 168.0, 293.0, 620.0, 1551.0, 4887.0, 24093.0, 206654.0, 667490.0, 120611.0, 15813.0, 3740.0, 1288.0, 539.0, 271.0, 137.0, 80.0, 40.0, 27.0, 17.0, 8.0, 9.0, 2.0, 8.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.515625, -0.49745941162109375, -0.4792938232421875, -0.46112823486328125, -0.442962646484375, -0.42479705810546875, -0.4066314697265625, -0.38846588134765625, -0.37030029296875, -0.35213470458984375, -0.3339691162109375, -0.31580352783203125, -0.297637939453125, -0.27947235107421875, -0.2613067626953125, -0.24314117431640625, -0.2249755859375, -0.20680999755859375, -0.1886444091796875, -0.17047882080078125, -0.152313232421875, -0.13414764404296875, -0.1159820556640625, -0.09781646728515625, -0.07965087890625, -0.06148529052734375, -0.0433197021484375, -0.02515411376953125, -0.006988525390625, 0.01117706298828125, 0.0293426513671875, 0.04750823974609375, 0.065673828125, 0.08383941650390625, 0.1020050048828125, 0.12017059326171875, 0.138336181640625, 0.15650177001953125, 0.1746673583984375, 0.19283294677734375, 0.21099853515625, 0.22916412353515625, 0.2473297119140625, 0.26549530029296875, 0.283660888671875, 0.30182647705078125, 0.3199920654296875, 0.33815765380859375, 0.3563232421875, 0.37448883056640625, 0.3926544189453125, 0.41082000732421875, 0.428985595703125, 0.44715118408203125, 0.4653167724609375, 0.48348236083984375, 0.50164794921875, 0.5198135375976562, 0.5379791259765625, 0.5561447143554688, 0.574310302734375, 0.5924758911132812, 0.6106414794921875, 0.6288070678710938, 0.64697265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 9.0, 8.0, 17.0, 16.0, 32.0, 39.0, 51.0, 82.0, 125.0, 153.0, 138.0, 96.0, 81.0, 49.0, 34.0, 16.0, 17.0, 11.0, 10.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015926361083984375, -0.00015561282634735107, -0.0001519620418548584, -0.00014831125736236572, -0.00014466047286987305, -0.00014100968837738037, -0.0001373589038848877, -0.00013370811939239502, -0.00013005733489990234, -0.00012640655040740967, -0.000122755765914917, -0.00011910498142242432, -0.00011545419692993164, -0.00011180341243743896, -0.00010815262794494629, -0.00010450184345245361, -0.00010085105895996094, -9.720027446746826e-05, -9.354948997497559e-05, -8.989870548248291e-05, -8.624792098999023e-05, -8.259713649749756e-05, -7.894635200500488e-05, -7.529556751251221e-05, -7.164478302001953e-05, -6.799399852752686e-05, -6.434321403503418e-05, -6.0692429542541504e-05, -5.704164505004883e-05, -5.339086055755615e-05, -4.9740076065063477e-05, -4.60892915725708e-05, -4.2438507080078125e-05, -3.878772258758545e-05, -3.5136938095092773e-05, -3.14861536026001e-05, -2.7835369110107422e-05, -2.4184584617614746e-05, -2.053380012512207e-05, -1.6883015632629395e-05, -1.3232231140136719e-05, -9.581446647644043e-06, -5.930662155151367e-06, -2.2798776626586914e-06, 1.3709068298339844e-06, 5.02169132232666e-06, 8.672475814819336e-06, 1.2323260307312012e-05, 1.5974044799804688e-05, 1.9624829292297363e-05, 2.327561378479004e-05, 2.6926398277282715e-05, 3.057718276977539e-05, 3.4227967262268066e-05, 3.787875175476074e-05, 4.152953624725342e-05, 4.5180320739746094e-05, 4.883110523223877e-05, 5.2481889724731445e-05, 5.613267421722412e-05, 5.97834587097168e-05, 6.343424320220947e-05, 6.708502769470215e-05, 7.073581218719482e-05, 7.43865966796875e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 5.0, 10.0, 5.0, 10.0, 20.0, 33.0, 70.0, 161.0, 364.0, 1170.0, 4589.0, 30293.0, 412589.0, 551910.0, 39579.0, 5544.0, 1354.0, 488.0, 171.0, 77.0, 49.0, 23.0, 15.0, 9.0, 3.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.0126953125, -0.9891777038574219, -0.9656600952148438, -0.9421424865722656, -0.9186248779296875, -0.8951072692871094, -0.8715896606445312, -0.8480720520019531, -0.824554443359375, -0.8010368347167969, -0.7775192260742188, -0.7540016174316406, -0.7304840087890625, -0.7069664001464844, -0.6834487915039062, -0.6599311828613281, -0.63641357421875, -0.6128959655761719, -0.5893783569335938, -0.5658607482910156, -0.5423431396484375, -0.5188255310058594, -0.49530792236328125, -0.4717903137207031, -0.448272705078125, -0.4247550964355469, -0.40123748779296875, -0.3777198791503906, -0.3542022705078125, -0.3306846618652344, -0.30716705322265625, -0.2836494445800781, -0.2601318359375, -0.23661422729492188, -0.21309661865234375, -0.18957901000976562, -0.1660614013671875, -0.14254379272460938, -0.11902618408203125, -0.09550857543945312, -0.071990966796875, -0.048473358154296875, -0.02495574951171875, -0.001438140869140625, 0.0220794677734375, 0.045597076416015625, 0.06911468505859375, 0.09263229370117188, 0.11614990234375, 0.13966751098632812, 0.16318511962890625, 0.18670272827148438, 0.2102203369140625, 0.23373794555664062, 0.25725555419921875, 0.2807731628417969, 0.304290771484375, 0.3278083801269531, 0.35132598876953125, 0.3748435974121094, 0.3983612060546875, 0.4218788146972656, 0.44539642333984375, 0.4689140319824219, 0.492431640625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 5.0, 17.0, 12.0, 15.0, 25.0, 22.0, 49.0, 71.0, 86.0, 116.0, 114.0, 112.0, 99.0, 69.0, 55.0, 30.0, 30.0, 18.0, 15.0, 11.0, 11.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.533203125, -0.5189895629882812, -0.5047760009765625, -0.49056243896484375, -0.476348876953125, -0.46213531494140625, -0.4479217529296875, -0.43370819091796875, -0.41949462890625, -0.40528106689453125, -0.3910675048828125, -0.37685394287109375, -0.362640380859375, -0.34842681884765625, -0.3342132568359375, -0.31999969482421875, -0.3057861328125, -0.29157257080078125, -0.2773590087890625, -0.26314544677734375, -0.248931884765625, -0.23471832275390625, -0.2205047607421875, -0.20629119873046875, -0.19207763671875, -0.17786407470703125, -0.1636505126953125, -0.14943695068359375, -0.135223388671875, -0.12100982666015625, -0.1067962646484375, -0.09258270263671875, -0.078369140625, -0.06415557861328125, -0.0499420166015625, -0.03572845458984375, -0.021514892578125, -0.00730133056640625, 0.0069122314453125, 0.02112579345703125, 0.03533935546875, 0.04955291748046875, 0.0637664794921875, 0.07798004150390625, 0.092193603515625, 0.10640716552734375, 0.1206207275390625, 0.13483428955078125, 0.1490478515625, 0.16326141357421875, 0.1774749755859375, 0.19168853759765625, 0.205902099609375, 0.22011566162109375, 0.2343292236328125, 0.24854278564453125, 0.26275634765625, 0.27696990966796875, 0.2911834716796875, 0.30539703369140625, 0.319610595703125, 0.33382415771484375, 0.3480377197265625, 0.36225128173828125, 0.37646484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 13.0, 24.0, 43.0, 83.0, 110.0, 169.0, 162.0, 141.0, 121.0, 58.0, 39.0, 17.0, 5.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.583742618560791, -5.280097007751465, -4.976451396942139, -4.6728057861328125, -4.369159698486328, -4.06551456451416, -3.761868476867676, -3.4582228660583496, -3.1545772552490234, -2.8509316444396973, -2.547286033630371, -2.243640184402466, -1.9399945735931396, -1.6363489627838135, -1.3327032327651978, -1.029057502746582, -0.7254118919372559, -0.4217662215232849, -0.11812055110931396, 0.18552511930465698, 0.48917078971862793, 0.7928164005279541, 1.0964621305465698, 1.4001078605651855, 1.7037534713745117, 2.007399082183838, 2.311044692993164, 2.6146905422210693, 2.9183361530303955, 3.2219817638397217, 3.525627613067627, 3.829273223876953, 4.1329193115234375, 4.436564922332764, 4.74021053314209, 5.043856143951416, 5.347501754760742, 5.651147842407227, 5.954793453216553, 6.258439064025879, 6.562084674835205, 6.865730285644531, 7.169375896453857, 7.473021507263184, 7.776667594909668, 8.080312728881836, 8.38395881652832, 8.687604904174805, 8.991250038146973, 9.294896125793457, 9.598541259765625, 9.90218734741211, 10.205832481384277, 10.509478569030762, 10.81312370300293, 11.116769790649414, 11.420415878295898, 11.724061965942383, 12.02770709991455, 12.331353187561035, 12.634998321533203, 12.938644409179688, 13.242289543151855, 13.54593563079834, 13.849580764770508]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 7.0, 1.0, 8.0, 11.0, 14.0, 6.0, 8.0, 11.0, 16.0, 17.0, 15.0, 26.0, 27.0, 23.0, 21.0, 34.0, 27.0, 22.0, 29.0, 44.0, 36.0, 25.0, 45.0, 42.0, 42.0, 34.0, 40.0, 44.0, 29.0, 30.0, 27.0, 28.0, 25.0, 23.0, 21.0, 20.0, 15.0, 24.0, 13.0, 14.0, 5.0, 6.0, 13.0, 8.0, 4.0, 7.0, 8.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.377024173736572, -4.24040412902832, -4.103784084320068, -3.9671640396118164, -3.8305439949035645, -3.6939239501953125, -3.5573041439056396, -3.4206840991973877, -3.2840640544891357, -3.147444009780884, -3.010823965072632, -2.87420392036438, -2.737584114074707, -2.600964069366455, -2.464344024658203, -2.327723979949951, -2.191103935241699, -2.0544838905334473, -1.9178638458251953, -1.781243920326233, -1.644623875617981, -1.508003830909729, -1.3713839054107666, -1.2347638607025146, -1.0981438159942627, -0.9615237712860107, -0.8249037861824036, -0.6882838010787964, -0.5516637563705444, -0.4150437116622925, -0.2784237265586853, -0.14180374145507812, -0.005184173583984375, 0.1314358413219452, 0.26805585622787476, 0.4046758711338043, 0.5412958860397339, 0.6779159307479858, 0.814535915851593, 0.9511559009552002, 1.0877759456634521, 1.224395990371704, 1.361016035079956, 1.4976359605789185, 1.6342560052871704, 1.7708760499954224, 1.9074959754943848, 2.0441160202026367, 2.1807360649108887, 2.3173561096191406, 2.4539761543273926, 2.5905961990356445, 2.7272162437438965, 2.8638362884521484, 3.0004560947418213, 3.1370761394500732, 3.273696184158325, 3.410316228866577, 3.546936273574829, 3.683556318283081, 3.820176124572754, 3.956796169281006, 4.093416213989258, 4.23003625869751, 4.366656303405762]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 4.0, 7.0, 5.0, 15.0, 14.0, 13.0, 13.0, 23.0, 28.0, 38.0, 44.0, 69.0, 111.0, 163.0, 279.0, 555.0, 1147.0, 2822.0, 8206.0, 30196.0, 844059.0, 3257799.0, 33665.0, 8948.0, 3219.0, 1404.0, 625.0, 320.0, 196.0, 98.0, 72.0, 39.0, 34.0, 17.0, 12.0, 4.0, 9.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.237884521484375, -4.13201904296875, -4.026153564453125, -3.9202880859375, -3.814422607421875, -3.70855712890625, -3.602691650390625, -3.496826171875, -3.390960693359375, -3.28509521484375, -3.179229736328125, -3.0733642578125, -2.967498779296875, -2.86163330078125, -2.755767822265625, -2.64990234375, -2.544036865234375, -2.43817138671875, -2.332305908203125, -2.2264404296875, -2.120574951171875, -2.01470947265625, -1.908843994140625, -1.802978515625, -1.697113037109375, -1.59124755859375, -1.485382080078125, -1.3795166015625, -1.273651123046875, -1.16778564453125, -1.061920166015625, -0.9560546875, -0.850189208984375, -0.74432373046875, -0.638458251953125, -0.5325927734375, -0.426727294921875, -0.32086181640625, -0.214996337890625, -0.109130859375, -0.003265380859375, 0.10260009765625, 0.208465576171875, 0.3143310546875, 0.420196533203125, 0.52606201171875, 0.631927490234375, 0.73779296875, 0.843658447265625, 0.94952392578125, 1.055389404296875, 1.1612548828125, 1.267120361328125, 1.37298583984375, 1.478851318359375, 1.584716796875, 1.690582275390625, 1.79644775390625, 1.902313232421875, 2.0081787109375, 2.114044189453125, 2.21990966796875, 2.325775146484375, 2.431640625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 8.0, 8.0, 11.0, 9.0, 21.0, 20.0, 20.0, 43.0, 45.0, 60.0, 60.0, 69.0, 71.0, 73.0, 81.0, 60.0, 62.0, 59.0, 54.0, 32.0, 42.0, 35.0, 15.0, 14.0, 14.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.5498046875, -0.5359840393066406, -0.5221633911132812, -0.5083427429199219, -0.4945220947265625, -0.4807014465332031, -0.46688079833984375, -0.4530601501464844, -0.439239501953125, -0.4254188537597656, -0.41159820556640625, -0.3977775573730469, -0.3839569091796875, -0.3701362609863281, -0.35631561279296875, -0.3424949645996094, -0.32867431640625, -0.3148536682128906, -0.30103302001953125, -0.2872123718261719, -0.2733917236328125, -0.2595710754394531, -0.24575042724609375, -0.23192977905273438, -0.218109130859375, -0.20428848266601562, -0.19046783447265625, -0.17664718627929688, -0.1628265380859375, -0.14900588989257812, -0.13518524169921875, -0.12136459350585938, -0.1075439453125, -0.09372329711914062, -0.07990264892578125, -0.06608200073242188, -0.0522613525390625, -0.038440704345703125, -0.02462005615234375, -0.010799407958984375, 0.003021240234375, 0.016841888427734375, 0.03066253662109375, 0.044483184814453125, 0.0583038330078125, 0.07212448120117188, 0.08594512939453125, 0.09976577758789062, 0.11358642578125, 0.12740707397460938, 0.14122772216796875, 0.15504837036132812, 0.1688690185546875, 0.18268966674804688, 0.19651031494140625, 0.21033096313476562, 0.224151611328125, 0.23797225952148438, 0.25179290771484375, 0.2656135559082031, 0.2794342041015625, 0.2932548522949219, 0.30707550048828125, 0.3208961486816406, 0.334716796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 16.0, 6.0, 17.0, 31.0, 30.0, 42.0, 48.0, 79.0, 94.0, 119.0, 172.0, 251.0, 289.0, 485.0, 806.0, 1553.0, 3364.0, 8745.0, 31024.0, 252845.0, 3766816.0, 96374.0, 18960.0, 6149.0, 2509.0, 1264.0, 707.0, 400.0, 279.0, 198.0, 147.0, 96.0, 100.0, 70.0, 49.0, 35.0, 26.0, 18.0, 15.0, 9.0, 8.0, 8.0, 6.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.04736328125, -1.9775390625, -1.90771484375, -1.837890625, -1.76806640625, -1.6982421875, -1.62841796875, -1.55859375, -1.48876953125, -1.4189453125, -1.34912109375, -1.279296875, -1.20947265625, -1.1396484375, -1.06982421875, -1.0, -0.93017578125, -0.8603515625, -0.79052734375, -0.720703125, -0.65087890625, -0.5810546875, -0.51123046875, -0.44140625, -0.37158203125, -0.3017578125, -0.23193359375, -0.162109375, -0.09228515625, -0.0224609375, 0.04736328125, 0.1171875, 0.18701171875, 0.2568359375, 0.32666015625, 0.396484375, 0.46630859375, 0.5361328125, 0.60595703125, 0.67578125, 0.74560546875, 0.8154296875, 0.88525390625, 0.955078125, 1.02490234375, 1.0947265625, 1.16455078125, 1.234375, 1.30419921875, 1.3740234375, 1.44384765625, 1.513671875, 1.58349609375, 1.6533203125, 1.72314453125, 1.79296875, 1.86279296875, 1.9326171875, 2.00244140625, 2.072265625, 2.14208984375, 2.2119140625, 2.28173828125, 2.3515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 12.0, 10.0, 21.0, 29.0, 62.0, 174.0, 839.0, 2488.0, 223.0, 92.0, 45.0, 25.0, 13.0, 10.0, 6.0, 4.0, 5.0, 5.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.201171875, -1.1660003662109375, -1.130828857421875, -1.0956573486328125, -1.06048583984375, -1.0253143310546875, -0.990142822265625, -0.9549713134765625, -0.9197998046875, -0.8846282958984375, -0.849456787109375, -0.8142852783203125, -0.77911376953125, -0.7439422607421875, -0.708770751953125, -0.6735992431640625, -0.638427734375, -0.6032562255859375, -0.568084716796875, -0.5329132080078125, -0.49774169921875, -0.4625701904296875, -0.427398681640625, -0.3922271728515625, -0.3570556640625, -0.3218841552734375, -0.286712646484375, -0.2515411376953125, -0.21636962890625, -0.1811981201171875, -0.146026611328125, -0.1108551025390625, -0.07568359375, -0.0405120849609375, -0.005340576171875, 0.0298309326171875, 0.06500244140625, 0.1001739501953125, 0.135345458984375, 0.1705169677734375, 0.2056884765625, 0.2408599853515625, 0.276031494140625, 0.3112030029296875, 0.34637451171875, 0.3815460205078125, 0.416717529296875, 0.4518890380859375, 0.487060546875, 0.5222320556640625, 0.557403564453125, 0.5925750732421875, 0.62774658203125, 0.6629180908203125, 0.698089599609375, 0.7332611083984375, 0.7684326171875, 0.8036041259765625, 0.838775634765625, 0.8739471435546875, 0.90911865234375, 0.9442901611328125, 0.979461669921875, 1.0146331787109375, 1.0498046875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 8.0, 16.0, 33.0, 97.0, 300.0, 352.0, 145.0, 35.0, 12.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.955515384674072, -6.655892372131348, -6.356269359588623, -6.056646347045898, -5.757023811340332, -5.457400798797607, -5.157777786254883, -4.858155250549316, -4.558531761169434, -4.258908748626709, -3.9592859745025635, -3.659662961959839, -3.3600401878356934, -3.0604171752929688, -2.760794162750244, -2.4611713886260986, -2.161548614501953, -1.861925721168518, -1.562302827835083, -1.2626798152923584, -0.9630569219589233, -0.6634340286254883, -0.36381101608276367, -0.06418824195861816, 0.23543477058410645, 0.5350576639175415, 0.8346806168556213, 1.1343035697937012, 1.4339264631271362, 1.7335493564605713, 2.033172369003296, 2.3327951431274414, 2.632417678833008, 2.9320406913757324, 3.231663465499878, 3.5312864780426025, 3.830909252166748, 4.130532264709473, 4.430155277252197, 4.729778289794922, 5.029400825500488, 5.329023838043213, 5.6286468505859375, 5.928269386291504, 6.2278923988342285, 6.527515411376953, 6.827138423919678, 7.126761436462402, 7.426384449005127, 7.726007461547852, 8.025629997253418, 8.3252534866333, 8.624876022338867, 8.92449951171875, 9.224122047424316, 9.523744583129883, 9.823368072509766, 10.122990608215332, 10.422614097595215, 10.722236633300781, 11.021860122680664, 11.32148265838623, 11.621105194091797, 11.92072868347168, 12.220351219177246]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 13.0, 17.0, 17.0, 24.0, 38.0, 47.0, 71.0, 65.0, 70.0, 85.0, 87.0, 86.0, 84.0, 70.0, 53.0, 56.0, 26.0, 34.0, 16.0, 12.0, 5.0, 0.0, 5.0, 3.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.753364086151123, -3.634342670440674, -3.5153210163116455, -3.3962996006011963, -3.277278184890747, -3.1582565307617188, -3.0392351150512695, -2.9202136993408203, -2.801192283630371, -2.682170867919922, -2.5631492137908936, -2.4441277980804443, -2.325106382369995, -2.206084728240967, -2.0870633125305176, -1.9680418968200684, -1.8490203619003296, -1.7299988269805908, -1.6109774112701416, -1.4919558763504028, -1.3729344606399536, -1.2539129257202148, -1.1348915100097656, -1.0158699750900269, -0.8968484997749329, -0.7778270244598389, -0.6588055491447449, -0.5397840738296509, -0.4207625687122345, -0.3017410635948181, -0.18271958827972412, -0.06369811296463013, 0.05532336235046387, 0.17434483766555786, 0.29336631298065186, 0.41238781809806824, 0.5314092636108398, 0.6504307985305786, 0.7694522738456726, 0.8884737491607666, 1.0074951648712158, 1.1265166997909546, 1.2455381155014038, 1.3645596504211426, 1.4835810661315918, 1.6026026010513306, 1.7216241359710693, 1.8406455516815186, 1.9596670866012573, 2.078688621520996, 2.1977100372314453, 2.3167314529418945, 2.435753107070923, 2.554774522781372, 2.6737959384918213, 2.7928175926208496, 2.911839008331299, 3.030860424041748, 3.1498820781707764, 3.2689034938812256, 3.387924909591675, 3.506946563720703, 3.6259679794311523, 3.7449893951416016, 3.864010810852051]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 13.0, 12.0, 12.0, 20.0, 25.0, 38.0, 68.0, 119.0, 205.0, 362.0, 713.0, 1964.0, 5882.0, 24417.0, 155221.0, 633606.0, 186653.0, 28762.0, 6679.0, 2088.0, 804.0, 415.0, 180.0, 79.0, 65.0, 53.0, 23.0, 16.0, 21.0, 10.0, 6.0, 6.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.375, -2.299713134765625, -2.22442626953125, -2.149139404296875, -2.0738525390625, -1.998565673828125, -1.92327880859375, -1.847991943359375, -1.772705078125, -1.697418212890625, -1.62213134765625, -1.546844482421875, -1.4715576171875, -1.396270751953125, -1.32098388671875, -1.245697021484375, -1.17041015625, -1.095123291015625, -1.01983642578125, -0.944549560546875, -0.8692626953125, -0.793975830078125, -0.71868896484375, -0.643402099609375, -0.568115234375, -0.492828369140625, -0.41754150390625, -0.342254638671875, -0.2669677734375, -0.191680908203125, -0.11639404296875, -0.041107177734375, 0.0341796875, 0.109466552734375, 0.18475341796875, 0.260040283203125, 0.3353271484375, 0.410614013671875, 0.48590087890625, 0.561187744140625, 0.636474609375, 0.711761474609375, 0.78704833984375, 0.862335205078125, 0.9376220703125, 1.012908935546875, 1.08819580078125, 1.163482666015625, 1.23876953125, 1.314056396484375, 1.38934326171875, 1.464630126953125, 1.5399169921875, 1.615203857421875, 1.69049072265625, 1.765777587890625, 1.841064453125, 1.916351318359375, 1.99163818359375, 2.066925048828125, 2.1422119140625, 2.217498779296875, 2.29278564453125, 2.368072509765625, 2.443359375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 11.0, 16.0, 18.0, 23.0, 40.0, 50.0, 40.0, 53.0, 72.0, 74.0, 80.0, 92.0, 65.0, 79.0, 77.0, 45.0, 41.0, 30.0, 24.0, 18.0, 16.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.62451171875, -0.60888671875, -0.59326171875, -0.57763671875, -0.56201171875, -0.54638671875, -0.53076171875, -0.51513671875, -0.49951171875, -0.48388671875, -0.46826171875, -0.45263671875, -0.43701171875, -0.42138671875, -0.40576171875, -0.39013671875, -0.37451171875, -0.35888671875, -0.34326171875, -0.32763671875, -0.31201171875, -0.29638671875, -0.28076171875, -0.26513671875, -0.24951171875, -0.23388671875, -0.21826171875, -0.20263671875, -0.18701171875, -0.17138671875, -0.15576171875, -0.14013671875, -0.12451171875, -0.10888671875, -0.09326171875, -0.07763671875, -0.06201171875, -0.04638671875, -0.03076171875, -0.01513671875, 0.00048828125, 0.01611328125, 0.03173828125, 0.04736328125, 0.06298828125, 0.07861328125, 0.09423828125, 0.10986328125, 0.12548828125, 0.14111328125, 0.15673828125, 0.17236328125, 0.18798828125, 0.20361328125, 0.21923828125, 0.23486328125, 0.25048828125, 0.26611328125, 0.28173828125, 0.29736328125, 0.31298828125, 0.32861328125, 0.34423828125, 0.35986328125, 0.37548828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 8.0, 1.0, 5.0, 6.0, 10.0, 7.0, 16.0, 27.0, 32.0, 36.0, 66.0, 89.0, 130.0, 218.0, 362.0, 640.0, 1220.0, 2454.0, 5213.0, 12005.0, 30018.0, 83844.0, 231306.0, 374153.0, 192808.0, 69160.0, 25308.0, 10255.0, 4389.0, 2100.0, 1120.0, 589.0, 324.0, 212.0, 133.0, 73.0, 54.0, 39.0, 33.0, 18.0, 20.0, 11.0, 11.0, 13.0, 2.0, 3.0, 10.0, 5.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89453125, -0.8651123046875, -0.835693359375, -0.8062744140625, -0.77685546875, -0.7474365234375, -0.718017578125, -0.6885986328125, -0.6591796875, -0.6297607421875, -0.600341796875, -0.5709228515625, -0.54150390625, -0.5120849609375, -0.482666015625, -0.4532470703125, -0.423828125, -0.3944091796875, -0.364990234375, -0.3355712890625, -0.30615234375, -0.2767333984375, -0.247314453125, -0.2178955078125, -0.1884765625, -0.1590576171875, -0.129638671875, -0.1002197265625, -0.07080078125, -0.0413818359375, -0.011962890625, 0.0174560546875, 0.046875, 0.0762939453125, 0.105712890625, 0.1351318359375, 0.16455078125, 0.1939697265625, 0.223388671875, 0.2528076171875, 0.2822265625, 0.3116455078125, 0.341064453125, 0.3704833984375, 0.39990234375, 0.4293212890625, 0.458740234375, 0.4881591796875, 0.517578125, 0.5469970703125, 0.576416015625, 0.6058349609375, 0.63525390625, 0.6646728515625, 0.694091796875, 0.7235107421875, 0.7529296875, 0.7823486328125, 0.811767578125, 0.8411865234375, 0.87060546875, 0.9000244140625, 0.929443359375, 0.9588623046875, 0.98828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 7.0, 12.0, 9.0, 11.0, 16.0, 22.0, 22.0, 13.0, 34.0, 26.0, 34.0, 36.0, 29.0, 47.0, 51.0, 48.0, 66.0, 46.0, 56.0, 30.0, 41.0, 45.0, 38.0, 31.0, 43.0, 32.0, 21.0, 16.0, 29.0, 22.0, 7.0, 12.0, 9.0, 5.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.18072509765625, -1.1378173828125, -1.09490966796875, -1.052001953125, -1.00909423828125, -0.9661865234375, -0.92327880859375, -0.88037109375, -0.83746337890625, -0.7945556640625, -0.75164794921875, -0.708740234375, -0.66583251953125, -0.6229248046875, -0.58001708984375, -0.537109375, -0.49420166015625, -0.4512939453125, -0.40838623046875, -0.365478515625, -0.32257080078125, -0.2796630859375, -0.23675537109375, -0.19384765625, -0.15093994140625, -0.1080322265625, -0.06512451171875, -0.022216796875, 0.02069091796875, 0.0635986328125, 0.10650634765625, 0.1494140625, 0.19232177734375, 0.2352294921875, 0.27813720703125, 0.321044921875, 0.36395263671875, 0.4068603515625, 0.44976806640625, 0.49267578125, 0.53558349609375, 0.5784912109375, 0.62139892578125, 0.664306640625, 0.70721435546875, 0.7501220703125, 0.79302978515625, 0.8359375, 0.87884521484375, 0.9217529296875, 0.96466064453125, 1.007568359375, 1.05047607421875, 1.0933837890625, 1.13629150390625, 1.17919921875, 1.22210693359375, 1.2650146484375, 1.30792236328125, 1.350830078125, 1.39373779296875, 1.4366455078125, 1.47955322265625, 1.5224609375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 19.0, 20.0, 42.0, 49.0, 58.0, 96.0, 165.0, 216.0, 372.0, 670.0, 1408.0, 3565.0, 11993.0, 94883.0, 776643.0, 136286.0, 14642.0, 4112.0, 1531.0, 728.0, 374.0, 224.0, 151.0, 79.0, 50.0, 50.0, 40.0, 25.0, 14.0, 7.0, 7.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.02734375, -0.9937286376953125, -0.960113525390625, -0.9264984130859375, -0.89288330078125, -0.8592681884765625, -0.825653076171875, -0.7920379638671875, -0.7584228515625, -0.7248077392578125, -0.691192626953125, -0.6575775146484375, -0.62396240234375, -0.5903472900390625, -0.556732177734375, -0.5231170654296875, -0.489501953125, -0.4558868408203125, -0.422271728515625, -0.3886566162109375, -0.35504150390625, -0.3214263916015625, -0.287811279296875, -0.2541961669921875, -0.2205810546875, -0.1869659423828125, -0.153350830078125, -0.1197357177734375, -0.08612060546875, -0.0525054931640625, -0.018890380859375, 0.0147247314453125, 0.04833984375, 0.0819549560546875, 0.115570068359375, 0.1491851806640625, 0.18280029296875, 0.2164154052734375, 0.250030517578125, 0.2836456298828125, 0.3172607421875, 0.3508758544921875, 0.384490966796875, 0.4181060791015625, 0.45172119140625, 0.4853363037109375, 0.518951416015625, 0.5525665283203125, 0.586181640625, 0.6197967529296875, 0.653411865234375, 0.6870269775390625, 0.72064208984375, 0.7542572021484375, 0.787872314453125, 0.8214874267578125, 0.8551025390625, 0.8887176513671875, 0.922332763671875, 0.9559478759765625, 0.98956298828125, 1.0231781005859375, 1.056793212890625, 1.0904083251953125, 1.1240234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 10.0, 19.0, 32.0, 34.0, 65.0, 102.0, 172.0, 187.0, 141.0, 80.0, 71.0, 35.0, 18.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021910667419433594, -0.00021290406584739685, -0.00020670145750045776, -0.00020049884915351868, -0.0001942962408065796, -0.0001880936324596405, -0.00018189102411270142, -0.00017568841576576233, -0.00016948580741882324, -0.00016328319907188416, -0.00015708059072494507, -0.00015087798237800598, -0.0001446753740310669, -0.0001384727656841278, -0.00013227015733718872, -0.00012606754899024963, -0.00011986494064331055, -0.00011366233229637146, -0.00010745972394943237, -0.00010125711560249329, -9.50545072555542e-05, -8.885189890861511e-05, -8.264929056167603e-05, -7.644668221473694e-05, -7.024407386779785e-05, -6.404146552085876e-05, -5.783885717391968e-05, -5.163624882698059e-05, -4.5433640480041504e-05, -3.923103213310242e-05, -3.302842378616333e-05, -2.6825815439224243e-05, -2.0623207092285156e-05, -1.442059874534607e-05, -8.217990398406982e-06, -2.0153820514678955e-06, 4.187226295471191e-06, 1.0389834642410278e-05, 1.6592442989349365e-05, 2.2795051336288452e-05, 2.899765968322754e-05, 3.5200268030166626e-05, 4.140287637710571e-05, 4.76054847240448e-05, 5.380809307098389e-05, 6.0010701417922974e-05, 6.621330976486206e-05, 7.241591811180115e-05, 7.861852645874023e-05, 8.482113480567932e-05, 9.102374315261841e-05, 9.72263514995575e-05, 0.00010342895984649658, 0.00010963156819343567, 0.00011583417654037476, 0.00012203678488731384, 0.00012823939323425293, 0.00013444200158119202, 0.0001406446099281311, 0.0001468472182750702, 0.00015304982662200928, 0.00015925243496894836, 0.00016545504331588745, 0.00017165765166282654, 0.00017786026000976562]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 15.0, 18.0, 27.0, 44.0, 61.0, 98.0, 143.0, 315.0, 831.0, 2190.0, 8277.0, 76833.0, 794976.0, 147772.0, 12163.0, 2932.0, 965.0, 403.0, 177.0, 100.0, 73.0, 46.0, 31.0, 22.0, 14.0, 9.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9881591796875, -0.947998046875, -0.9078369140625, -0.86767578125, -0.8275146484375, -0.787353515625, -0.7471923828125, -0.70703125, -0.6668701171875, -0.626708984375, -0.5865478515625, -0.54638671875, -0.5062255859375, -0.466064453125, -0.4259033203125, -0.3857421875, -0.3455810546875, -0.305419921875, -0.2652587890625, -0.22509765625, -0.1849365234375, -0.144775390625, -0.1046142578125, -0.064453125, -0.0242919921875, 0.015869140625, 0.0560302734375, 0.09619140625, 0.1363525390625, 0.176513671875, 0.2166748046875, 0.2568359375, 0.2969970703125, 0.337158203125, 0.3773193359375, 0.41748046875, 0.4576416015625, 0.497802734375, 0.5379638671875, 0.578125, 0.6182861328125, 0.658447265625, 0.6986083984375, 0.73876953125, 0.7789306640625, 0.819091796875, 0.8592529296875, 0.8994140625, 0.9395751953125, 0.979736328125, 1.0198974609375, 1.06005859375, 1.1002197265625, 1.140380859375, 1.1805419921875, 1.220703125, 1.2608642578125, 1.301025390625, 1.3411865234375, 1.38134765625, 1.4215087890625, 1.461669921875, 1.5018310546875, 1.5419921875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 3.0, 8.0, 13.0, 10.0, 31.0, 51.0, 53.0, 94.0, 119.0, 144.0, 137.0, 97.0, 84.0, 52.0, 34.0, 26.0, 14.0, 3.0, 4.0, 7.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.12890625, -1.0980300903320312, -1.0671539306640625, -1.0362777709960938, -1.005401611328125, -0.9745254516601562, -0.9436492919921875, -0.9127731323242188, -0.88189697265625, -0.8510208129882812, -0.8201446533203125, -0.7892684936523438, -0.758392333984375, -0.7275161743164062, -0.6966400146484375, -0.6657638549804688, -0.6348876953125, -0.6040115356445312, -0.5731353759765625, -0.5422592163085938, -0.511383056640625, -0.48050689697265625, -0.4496307373046875, -0.41875457763671875, -0.38787841796875, -0.35700225830078125, -0.3261260986328125, -0.29524993896484375, -0.264373779296875, -0.23349761962890625, -0.2026214599609375, -0.17174530029296875, -0.140869140625, -0.10999298095703125, -0.0791168212890625, -0.04824066162109375, -0.017364501953125, 0.01351165771484375, 0.0443878173828125, 0.07526397705078125, 0.10614013671875, 0.13701629638671875, 0.1678924560546875, 0.19876861572265625, 0.229644775390625, 0.26052093505859375, 0.2913970947265625, 0.32227325439453125, 0.3531494140625, 0.38402557373046875, 0.4149017333984375, 0.44577789306640625, 0.476654052734375, 0.5075302124023438, 0.5384063720703125, 0.5692825317382812, 0.60015869140625, 0.6310348510742188, 0.6619110107421875, 0.6927871704101562, 0.723663330078125, 0.7545394897460938, 0.7854156494140625, 0.8162918090820312, 0.84716796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 9.0, 11.0, 16.0, 29.0, 64.0, 112.0, 142.0, 196.0, 177.0, 130.0, 59.0, 35.0, 13.0, 9.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.208967208862305, -8.721240043640137, -8.233511924743652, -7.745784282684326, -7.258056640625, -6.770329475402832, -6.282601356506348, -5.79487419128418, -5.307146072387695, -4.819418430328369, -4.331690788269043, -3.843963146209717, -3.3562355041503906, -2.8685081005096436, -2.3807804584503174, -1.8930528163909912, -1.4053254127502441, -0.917597770690918, -0.4298701882362366, 0.057857394218444824, 0.545585036277771, 1.0333125591278076, 1.5210402011871338, 2.00876784324646, 2.496495485305786, 2.9842231273651123, 3.4719507694244385, 3.9596781730651855, 4.447405815124512, 4.935133457183838, 5.422861099243164, 5.91058874130249, 6.398316383361816, 6.886044025421143, 7.373771667480469, 7.861499309539795, 8.349226951599121, 8.836954116821289, 9.324682235717773, 9.812409400939941, 10.300137519836426, 10.787864685058594, 11.275592803955078, 11.763319969177246, 12.25104808807373, 12.738775253295898, 13.226503372192383, 13.71423053741455, 14.201957702636719, 14.689684867858887, 15.177412986755371, 15.665140151977539, 16.152868270874023, 16.640596389770508, 17.12832260131836, 17.616050720214844, 18.103778839111328, 18.591506958007812, 19.079233169555664, 19.56696128845215, 20.054689407348633, 20.542417526245117, 21.03014373779297, 21.517871856689453, 22.005599975585938]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 6.0, 6.0, 5.0, 9.0, 9.0, 6.0, 8.0, 16.0, 12.0, 13.0, 14.0, 22.0, 15.0, 25.0, 24.0, 27.0, 31.0, 35.0, 15.0, 41.0, 36.0, 54.0, 43.0, 41.0, 41.0, 39.0, 25.0, 41.0, 44.0, 42.0, 37.0, 33.0, 26.0, 31.0, 19.0, 21.0, 13.0, 16.0, 14.0, 11.0, 8.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.625533580780029, -6.410942554473877, -6.196352005004883, -5.9817609786987305, -5.767169952392578, -5.552578926086426, -5.337987899780273, -5.123397350311279, -4.908806324005127, -4.694215297698975, -4.4796247482299805, -4.265033721923828, -4.050442695617676, -3.8358516693115234, -3.62126088142395, -3.406670093536377, -3.1920790672302246, -2.9774880409240723, -2.762897253036499, -2.548306465148926, -2.3337154388427734, -2.119124412536621, -1.9045336246490479, -1.689942717552185, -1.4753518104553223, -1.2607609033584595, -1.0461699962615967, -0.8315790891647339, -0.6169881820678711, -0.4023972749710083, -0.1878063678741455, 0.026784539222717285, 0.24137544631958008, 0.45596635341644287, 0.6705572605133057, 0.8851481676101685, 1.0997390747070312, 1.314329981803894, 1.5289208889007568, 1.7435117959976196, 1.9581027030944824, 2.1726937294006348, 2.387284517288208, 2.6018753051757812, 2.8164663314819336, 3.031057357788086, 3.245648145675659, 3.4602389335632324, 3.6748299598693848, 3.889420986175537, 4.104011535644531, 4.318602561950684, 4.533193588256836, 4.747784614562988, 4.962375640869141, 5.176966190338135, 5.391557216644287, 5.6061482429504395, 5.820738792419434, 6.035329818725586, 6.249920845031738, 6.464511871337891, 6.679102897644043, 6.893693447113037, 7.1082844734191895]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 6.0, 3.0, 2.0, 6.0, 8.0, 16.0, 15.0, 24.0, 30.0, 36.0, 44.0, 81.0, 125.0, 185.0, 388.0, 867.0, 2393.0, 7723.0, 40197.0, 3689287.0, 418364.0, 25093.0, 5818.0, 1962.0, 815.0, 387.0, 159.0, 104.0, 52.0, 26.0, 29.0, 9.0, 10.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0], "bins": [-5.484375, -5.362152099609375, -5.23992919921875, -5.117706298828125, -4.9954833984375, -4.873260498046875, -4.75103759765625, -4.628814697265625, -4.506591796875, -4.384368896484375, -4.26214599609375, -4.139923095703125, -4.0177001953125, -3.895477294921875, -3.77325439453125, -3.651031494140625, -3.52880859375, -3.406585693359375, -3.28436279296875, -3.162139892578125, -3.0399169921875, -2.917694091796875, -2.79547119140625, -2.673248291015625, -2.551025390625, -2.428802490234375, -2.30657958984375, -2.184356689453125, -2.0621337890625, -1.939910888671875, -1.81768798828125, -1.695465087890625, -1.5732421875, -1.451019287109375, -1.32879638671875, -1.206573486328125, -1.0843505859375, -0.962127685546875, -0.83990478515625, -0.717681884765625, -0.595458984375, -0.473236083984375, -0.35101318359375, -0.228790283203125, -0.1065673828125, 0.015655517578125, 0.13787841796875, 0.260101318359375, 0.38232421875, 0.504547119140625, 0.62677001953125, 0.748992919921875, 0.8712158203125, 0.993438720703125, 1.11566162109375, 1.237884521484375, 1.360107421875, 1.482330322265625, 1.60455322265625, 1.726776123046875, 1.8489990234375, 1.971221923828125, 2.09344482421875, 2.215667724609375, 2.337890625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 9.0, 11.0, 8.0, 19.0, 14.0, 16.0, 24.0, 35.0, 34.0, 33.0, 64.0, 54.0, 59.0, 52.0, 67.0, 60.0, 79.0, 74.0, 60.0, 37.0, 34.0, 35.0, 31.0, 19.0, 20.0, 15.0, 12.0, 10.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.58984375, -0.5746307373046875, -0.559417724609375, -0.5442047119140625, -0.52899169921875, -0.5137786865234375, -0.498565673828125, -0.4833526611328125, -0.4681396484375, -0.4529266357421875, -0.437713623046875, -0.4225006103515625, -0.40728759765625, -0.3920745849609375, -0.376861572265625, -0.3616485595703125, -0.346435546875, -0.3312225341796875, -0.316009521484375, -0.3007965087890625, -0.28558349609375, -0.2703704833984375, -0.255157470703125, -0.2399444580078125, -0.2247314453125, -0.2095184326171875, -0.194305419921875, -0.1790924072265625, -0.16387939453125, -0.1486663818359375, -0.133453369140625, -0.1182403564453125, -0.10302734375, -0.0878143310546875, -0.072601318359375, -0.0573883056640625, -0.04217529296875, -0.0269622802734375, -0.011749267578125, 0.0034637451171875, 0.0186767578125, 0.0338897705078125, 0.049102783203125, 0.0643157958984375, 0.07952880859375, 0.0947418212890625, 0.109954833984375, 0.1251678466796875, 0.140380859375, 0.1555938720703125, 0.170806884765625, 0.1860198974609375, 0.20123291015625, 0.2164459228515625, 0.231658935546875, 0.2468719482421875, 0.2620849609375, 0.2772979736328125, 0.292510986328125, 0.3077239990234375, 0.32293701171875, 0.3381500244140625, 0.353363037109375, 0.3685760498046875, 0.3837890625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 7.0, 3.0, 9.0, 6.0, 7.0, 5.0, 8.0, 18.0, 26.0, 23.0, 46.0, 67.0, 68.0, 96.0, 154.0, 269.0, 430.0, 613.0, 1069.0, 2045.0, 4390.0, 10817.0, 42055.0, 444024.0, 3554445.0, 101146.0, 19329.0, 6485.0, 2889.0, 1435.0, 809.0, 527.0, 286.0, 191.0, 140.0, 95.0, 64.0, 44.0, 26.0, 30.0, 30.0, 13.0, 8.0, 4.0, 8.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.1953125, -2.125030517578125, -2.05474853515625, -1.984466552734375, -1.9141845703125, -1.843902587890625, -1.77362060546875, -1.703338623046875, -1.633056640625, -1.562774658203125, -1.49249267578125, -1.422210693359375, -1.3519287109375, -1.281646728515625, -1.21136474609375, -1.141082763671875, -1.07080078125, -1.000518798828125, -0.93023681640625, -0.859954833984375, -0.7896728515625, -0.719390869140625, -0.64910888671875, -0.578826904296875, -0.508544921875, -0.438262939453125, -0.36798095703125, -0.297698974609375, -0.2274169921875, -0.157135009765625, -0.08685302734375, -0.016571044921875, 0.0537109375, 0.123992919921875, 0.19427490234375, 0.264556884765625, 0.3348388671875, 0.405120849609375, 0.47540283203125, 0.545684814453125, 0.615966796875, 0.686248779296875, 0.75653076171875, 0.826812744140625, 0.8970947265625, 0.967376708984375, 1.03765869140625, 1.107940673828125, 1.17822265625, 1.248504638671875, 1.31878662109375, 1.389068603515625, 1.4593505859375, 1.529632568359375, 1.59991455078125, 1.670196533203125, 1.740478515625, 1.810760498046875, 1.88104248046875, 1.951324462890625, 2.0216064453125, 2.091888427734375, 2.16217041015625, 2.232452392578125, 2.302734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 4.0, 3.0, 5.0, 13.0, 14.0, 22.0, 26.0, 54.0, 158.0, 456.0, 2427.0, 512.0, 161.0, 88.0, 37.0, 27.0, 17.0, 10.0, 12.0, 9.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.314453125, -1.2740631103515625, -1.233673095703125, -1.1932830810546875, -1.15289306640625, -1.1125030517578125, -1.072113037109375, -1.0317230224609375, -0.9913330078125, -0.9509429931640625, -0.910552978515625, -0.8701629638671875, -0.82977294921875, -0.7893829345703125, -0.748992919921875, -0.7086029052734375, -0.668212890625, -0.6278228759765625, -0.587432861328125, -0.5470428466796875, -0.50665283203125, -0.4662628173828125, -0.425872802734375, -0.3854827880859375, -0.3450927734375, -0.3047027587890625, -0.264312744140625, -0.2239227294921875, -0.18353271484375, -0.1431427001953125, -0.102752685546875, -0.0623626708984375, -0.02197265625, 0.0184173583984375, 0.058807373046875, 0.0991973876953125, 0.13958740234375, 0.1799774169921875, 0.220367431640625, 0.2607574462890625, 0.3011474609375, 0.3415374755859375, 0.381927490234375, 0.4223175048828125, 0.46270751953125, 0.5030975341796875, 0.543487548828125, 0.5838775634765625, 0.624267578125, 0.6646575927734375, 0.705047607421875, 0.7454376220703125, 0.78582763671875, 0.8262176513671875, 0.866607666015625, 0.9069976806640625, 0.9473876953125, 0.9877777099609375, 1.028167724609375, 1.0685577392578125, 1.10894775390625, 1.1493377685546875, 1.189727783203125, 1.2301177978515625, 1.2705078125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 10.0, 23.0, 72.0, 194.0, 270.0, 247.0, 94.0, 54.0, 21.0, 5.0, 3.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.648687362670898, -4.309000015258789, -3.9693121910095215, -3.629624843597412, -3.2899370193481445, -2.950249671936035, -2.6105620861053467, -2.270874500274658, -1.9311869144439697, -1.5914993286132812, -1.2518117427825928, -0.9121242761611938, -0.5724366903305054, -0.2327491044998169, 0.10693836212158203, 0.4466259479522705, 0.786313533782959, 1.1260011196136475, 1.465688705444336, 1.8053761720657349, 2.145063877105713, 2.4847512245178223, 2.8244388103485107, 3.164126396179199, 3.5038139820098877, 3.843501567840576, 4.1831889152526855, 4.522876739501953, 4.8625640869140625, 5.20225191116333, 5.5419392585754395, 5.881627082824707, 6.221314430236816, 6.561001777648926, 6.900689601898193, 7.240376949310303, 7.58006477355957, 7.91975212097168, 8.259439468383789, 8.599126815795898, 8.938815116882324, 9.278502464294434, 9.618189811706543, 9.957878112792969, 10.297565460205078, 10.637252807617188, 10.976940155029297, 11.316627502441406, 11.656314849853516, 11.996002197265625, 12.335689544677734, 12.67537784576416, 13.01506519317627, 13.354752540588379, 13.694439888000488, 14.034128189086914, 14.373815536499023, 14.713502883911133, 15.053190231323242, 15.392878532409668, 15.732565879821777, 16.072254180908203, 16.411941528320312, 16.751628875732422, 17.09131622314453]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 9.0, 8.0, 13.0, 33.0, 31.0, 39.0, 64.0, 71.0, 90.0, 75.0, 89.0, 105.0, 84.0, 68.0, 54.0, 47.0, 42.0, 26.0, 22.0, 17.0, 5.0, 7.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.562389373779297, -5.396784782409668, -5.231180191040039, -5.06557559967041, -4.899971008300781, -4.734366416931152, -4.568761825561523, -4.4031572341918945, -4.237552642822266, -4.071948051452637, -3.906343460083008, -3.740738868713379, -3.57513427734375, -3.409529685974121, -3.243924856185913, -3.078320264816284, -2.912715435028076, -2.7471108436584473, -2.5815062522888184, -2.4159016609191895, -2.2502970695495605, -2.0846924781799316, -1.9190876483917236, -1.7534830570220947, -1.5878784656524658, -1.422273874282837, -1.256669282913208, -1.0910645723342896, -0.9254599809646606, -0.7598553895950317, -0.5942507386207581, -0.4286460876464844, -0.26304149627685547, -0.09743687510490417, 0.06816774606704712, 0.2337723672389984, 0.3993769884109497, 0.5649815797805786, 0.7305862307548523, 0.896190881729126, 1.0617954730987549, 1.2274000644683838, 1.3930046558380127, 1.5586093664169312, 1.72421395778656, 1.889818549156189, 2.0554232597351074, 2.2210278511047363, 2.3866324424743652, 2.552237033843994, 2.717841625213623, 2.883446216583252, 3.049050807952881, 3.2146553993225098, 3.3802602291107178, 3.5458648204803467, 3.7114694118499756, 3.8770740032196045, 4.0426788330078125, 4.208283424377441, 4.37388801574707, 4.539492607116699, 4.705097198486328, 4.870701789855957, 5.036306381225586]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 9.0, 5.0, 5.0, 8.0, 16.0, 19.0, 34.0, 55.0, 76.0, 153.0, 306.0, 666.0, 1633.0, 4864.0, 17796.0, 84524.0, 434452.0, 403895.0, 76191.0, 16503.0, 4620.0, 1510.0, 568.0, 275.0, 145.0, 81.0, 38.0, 35.0, 18.0, 15.0, 11.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.70361328125, -2.6240234375, -2.54443359375, -2.46484375, -2.38525390625, -2.3056640625, -2.22607421875, -2.146484375, -2.06689453125, -1.9873046875, -1.90771484375, -1.828125, -1.74853515625, -1.6689453125, -1.58935546875, -1.509765625, -1.43017578125, -1.3505859375, -1.27099609375, -1.19140625, -1.11181640625, -1.0322265625, -0.95263671875, -0.873046875, -0.79345703125, -0.7138671875, -0.63427734375, -0.5546875, -0.47509765625, -0.3955078125, -0.31591796875, -0.236328125, -0.15673828125, -0.0771484375, 0.00244140625, 0.08203125, 0.16162109375, 0.2412109375, 0.32080078125, 0.400390625, 0.47998046875, 0.5595703125, 0.63916015625, 0.71875, 0.79833984375, 0.8779296875, 0.95751953125, 1.037109375, 1.11669921875, 1.1962890625, 1.27587890625, 1.35546875, 1.43505859375, 1.5146484375, 1.59423828125, 1.673828125, 1.75341796875, 1.8330078125, 1.91259765625, 1.9921875, 2.07177734375, 2.1513671875, 2.23095703125, 2.310546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 7.0, 8.0, 9.0, 15.0, 15.0, 19.0, 21.0, 44.0, 44.0, 35.0, 36.0, 40.0, 68.0, 54.0, 81.0, 67.0, 77.0, 70.0, 50.0, 44.0, 37.0, 36.0, 29.0, 22.0, 20.0, 17.0, 9.0, 6.0, 5.0, 10.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.64599609375, -0.6293830871582031, -0.6127700805664062, -0.5961570739746094, -0.5795440673828125, -0.5629310607910156, -0.5463180541992188, -0.5297050476074219, -0.513092041015625, -0.4964790344238281, -0.47986602783203125, -0.4632530212402344, -0.4466400146484375, -0.4300270080566406, -0.41341400146484375, -0.3968009948730469, -0.38018798828125, -0.3635749816894531, -0.34696197509765625, -0.3303489685058594, -0.3137359619140625, -0.2971229553222656, -0.28050994873046875, -0.2638969421386719, -0.247283935546875, -0.23067092895507812, -0.21405792236328125, -0.19744491577148438, -0.1808319091796875, -0.16421890258789062, -0.14760589599609375, -0.13099288940429688, -0.1143798828125, -0.09776687622070312, -0.08115386962890625, -0.06454086303710938, -0.0479278564453125, -0.031314849853515625, -0.01470184326171875, 0.001911163330078125, 0.018524169921875, 0.035137176513671875, 0.05175018310546875, 0.06836318969726562, 0.0849761962890625, 0.10158920288085938, 0.11820220947265625, 0.13481521606445312, 0.15142822265625, 0.16804122924804688, 0.18465423583984375, 0.20126724243164062, 0.2178802490234375, 0.23449325561523438, 0.25110626220703125, 0.2677192687988281, 0.284332275390625, 0.3009452819824219, 0.31755828857421875, 0.3341712951660156, 0.3507843017578125, 0.3673973083496094, 0.38401031494140625, 0.4006233215332031, 0.417236328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 22.0, 11.0, 15.0, 27.0, 56.0, 94.0, 109.0, 206.0, 467.0, 924.0, 1896.0, 4329.0, 10595.0, 29847.0, 109112.0, 397174.0, 356843.0, 93565.0, 26708.0, 9271.0, 3789.0, 1718.0, 825.0, 388.0, 238.0, 133.0, 59.0, 39.0, 28.0, 26.0, 19.0, 7.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.384765625, -1.331390380859375, -1.27801513671875, -1.224639892578125, -1.1712646484375, -1.117889404296875, -1.06451416015625, -1.011138916015625, -0.957763671875, -0.904388427734375, -0.85101318359375, -0.797637939453125, -0.7442626953125, -0.690887451171875, -0.63751220703125, -0.584136962890625, -0.53076171875, -0.477386474609375, -0.42401123046875, -0.370635986328125, -0.3172607421875, -0.263885498046875, -0.21051025390625, -0.157135009765625, -0.103759765625, -0.050384521484375, 0.00299072265625, 0.056365966796875, 0.1097412109375, 0.163116455078125, 0.21649169921875, 0.269866943359375, 0.3232421875, 0.376617431640625, 0.42999267578125, 0.483367919921875, 0.5367431640625, 0.590118408203125, 0.64349365234375, 0.696868896484375, 0.750244140625, 0.803619384765625, 0.85699462890625, 0.910369873046875, 0.9637451171875, 1.017120361328125, 1.07049560546875, 1.123870849609375, 1.17724609375, 1.230621337890625, 1.28399658203125, 1.337371826171875, 1.3907470703125, 1.444122314453125, 1.49749755859375, 1.550872802734375, 1.604248046875, 1.657623291015625, 1.71099853515625, 1.764373779296875, 1.8177490234375, 1.871124267578125, 1.92449951171875, 1.977874755859375, 2.03125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 9.0, 5.0, 7.0, 2.0, 11.0, 9.0, 21.0, 15.0, 17.0, 18.0, 18.0, 32.0, 25.0, 51.0, 51.0, 45.0, 55.0, 54.0, 57.0, 55.0, 47.0, 59.0, 55.0, 48.0, 40.0, 41.0, 28.0, 29.0, 19.0, 16.0, 13.0, 9.0, 8.0, 10.0, 5.0, 8.0, 2.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.034698486328125, -1.96392822265625, -1.893157958984375, -1.8223876953125, -1.751617431640625, -1.68084716796875, -1.610076904296875, -1.539306640625, -1.468536376953125, -1.39776611328125, -1.326995849609375, -1.2562255859375, -1.185455322265625, -1.11468505859375, -1.043914794921875, -0.97314453125, -0.902374267578125, -0.83160400390625, -0.760833740234375, -0.6900634765625, -0.619293212890625, -0.54852294921875, -0.477752685546875, -0.406982421875, -0.336212158203125, -0.26544189453125, -0.194671630859375, -0.1239013671875, -0.053131103515625, 0.01763916015625, 0.088409423828125, 0.1591796875, 0.229949951171875, 0.30072021484375, 0.371490478515625, 0.4422607421875, 0.513031005859375, 0.58380126953125, 0.654571533203125, 0.725341796875, 0.796112060546875, 0.86688232421875, 0.937652587890625, 1.0084228515625, 1.079193115234375, 1.14996337890625, 1.220733642578125, 1.29150390625, 1.362274169921875, 1.43304443359375, 1.503814697265625, 1.5745849609375, 1.645355224609375, 1.71612548828125, 1.786895751953125, 1.857666015625, 1.928436279296875, 1.99920654296875, 2.069976806640625, 2.1407470703125, 2.211517333984375, 2.28228759765625, 2.353057861328125, 2.423828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 12.0, 12.0, 16.0, 36.0, 38.0, 74.0, 115.0, 220.0, 382.0, 739.0, 1682.0, 5380.0, 24594.0, 165052.0, 642676.0, 172988.0, 25366.0, 5763.0, 1801.0, 706.0, 373.0, 228.0, 106.0, 81.0, 36.0, 20.0, 19.0, 11.0, 4.0, 3.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.248046875, -1.211883544921875, -1.17572021484375, -1.139556884765625, -1.1033935546875, -1.067230224609375, -1.03106689453125, -0.994903564453125, -0.958740234375, -0.922576904296875, -0.88641357421875, -0.850250244140625, -0.8140869140625, -0.777923583984375, -0.74176025390625, -0.705596923828125, -0.66943359375, -0.633270263671875, -0.59710693359375, -0.560943603515625, -0.5247802734375, -0.488616943359375, -0.45245361328125, -0.416290283203125, -0.380126953125, -0.343963623046875, -0.30780029296875, -0.271636962890625, -0.2354736328125, -0.199310302734375, -0.16314697265625, -0.126983642578125, -0.0908203125, -0.054656982421875, -0.01849365234375, 0.017669677734375, 0.0538330078125, 0.089996337890625, 0.12615966796875, 0.162322998046875, 0.198486328125, 0.234649658203125, 0.27081298828125, 0.306976318359375, 0.3431396484375, 0.379302978515625, 0.41546630859375, 0.451629638671875, 0.48779296875, 0.523956298828125, 0.56011962890625, 0.596282958984375, 0.6324462890625, 0.668609619140625, 0.70477294921875, 0.740936279296875, 0.777099609375, 0.813262939453125, 0.84942626953125, 0.885589599609375, 0.9217529296875, 0.957916259765625, 0.99407958984375, 1.030242919921875, 1.06640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 11.0, 14.0, 16.0, 24.0, 53.0, 66.0, 75.0, 112.0, 135.0, 132.0, 104.0, 71.0, 68.0, 35.0, 27.0, 18.0, 9.0, 19.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001571178436279297, -0.0001510903239250183, -0.00014506280422210693, -0.00013903528451919556, -0.00013300776481628418, -0.0001269802451133728, -0.00012095272541046143, -0.00011492520570755005, -0.00010889768600463867, -0.0001028701663017273, -9.684264659881592e-05, -9.081512689590454e-05, -8.478760719299316e-05, -7.876008749008179e-05, -7.273256778717041e-05, -6.670504808425903e-05, -6.0677528381347656e-05, -5.465000867843628e-05, -4.86224889755249e-05, -4.2594969272613525e-05, -3.656744956970215e-05, -3.053992986679077e-05, -2.4512410163879395e-05, -1.8484890460968018e-05, -1.245737075805664e-05, -6.429851055145264e-06, -4.023313522338867e-07, 5.62518835067749e-06, 1.1652708053588867e-05, 1.7680227756500244e-05, 2.370774745941162e-05, 2.9735267162322998e-05, 3.5762786865234375e-05, 4.179030656814575e-05, 4.781782627105713e-05, 5.3845345973968506e-05, 5.987286567687988e-05, 6.590038537979126e-05, 7.192790508270264e-05, 7.795542478561401e-05, 8.398294448852539e-05, 9.001046419143677e-05, 9.603798389434814e-05, 0.00010206550359725952, 0.0001080930233001709, 0.00011412054300308228, 0.00012014806270599365, 0.00012617558240890503, 0.0001322031021118164, 0.00013823062181472778, 0.00014425814151763916, 0.00015028566122055054, 0.00015631318092346191, 0.0001623407006263733, 0.00016836822032928467, 0.00017439574003219604, 0.00018042325973510742, 0.0001864507794380188, 0.00019247829914093018, 0.00019850581884384155, 0.00020453333854675293, 0.0002105608582496643, 0.00021658837795257568, 0.00022261589765548706, 0.00022864341735839844]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 11.0, 4.0, 10.0, 4.0, 9.0, 23.0, 32.0, 35.0, 67.0, 98.0, 241.0, 464.0, 1161.0, 3943.0, 17746.0, 122127.0, 606771.0, 253001.0, 33406.0, 6367.0, 1755.0, 640.0, 271.0, 157.0, 83.0, 47.0, 36.0, 20.0, 13.0, 12.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.5205078125, -1.4840240478515625, -1.447540283203125, -1.4110565185546875, -1.37457275390625, -1.3380889892578125, -1.301605224609375, -1.2651214599609375, -1.2286376953125, -1.1921539306640625, -1.155670166015625, -1.1191864013671875, -1.08270263671875, -1.0462188720703125, -1.009735107421875, -0.9732513427734375, -0.936767578125, -0.9002838134765625, -0.863800048828125, -0.8273162841796875, -0.79083251953125, -0.7543487548828125, -0.717864990234375, -0.6813812255859375, -0.6448974609375, -0.6084136962890625, -0.571929931640625, -0.5354461669921875, -0.49896240234375, -0.4624786376953125, -0.425994873046875, -0.3895111083984375, -0.35302734375, -0.3165435791015625, -0.280059814453125, -0.2435760498046875, -0.20709228515625, -0.1706085205078125, -0.134124755859375, -0.0976409912109375, -0.0611572265625, -0.0246734619140625, 0.011810302734375, 0.0482940673828125, 0.08477783203125, 0.1212615966796875, 0.157745361328125, 0.1942291259765625, 0.230712890625, 0.2671966552734375, 0.303680419921875, 0.3401641845703125, 0.37664794921875, 0.4131317138671875, 0.449615478515625, 0.4860992431640625, 0.5225830078125, 0.5590667724609375, 0.595550537109375, 0.6320343017578125, 0.66851806640625, 0.7050018310546875, 0.741485595703125, 0.7779693603515625, 0.814453125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 11.0, 16.0, 29.0, 32.0, 32.0, 62.0, 101.0, 140.0, 163.0, 113.0, 88.0, 58.0, 39.0, 26.0, 26.0, 17.0, 6.0, 15.0, 7.0, 3.0, 8.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.826171875, -1.7821502685546875, -1.738128662109375, -1.6941070556640625, -1.65008544921875, -1.6060638427734375, -1.562042236328125, -1.5180206298828125, -1.4739990234375, -1.4299774169921875, -1.385955810546875, -1.3419342041015625, -1.29791259765625, -1.2538909912109375, -1.209869384765625, -1.1658477783203125, -1.121826171875, -1.0778045654296875, -1.033782958984375, -0.9897613525390625, -0.94573974609375, -0.9017181396484375, -0.857696533203125, -0.8136749267578125, -0.7696533203125, -0.7256317138671875, -0.681610107421875, -0.6375885009765625, -0.59356689453125, -0.5495452880859375, -0.505523681640625, -0.4615020751953125, -0.41748046875, -0.3734588623046875, -0.329437255859375, -0.2854156494140625, -0.24139404296875, -0.1973724365234375, -0.153350830078125, -0.1093292236328125, -0.0653076171875, -0.0212860107421875, 0.022735595703125, 0.0667572021484375, 0.11077880859375, 0.1548004150390625, 0.198822021484375, 0.2428436279296875, 0.286865234375, 0.3308868408203125, 0.374908447265625, 0.4189300537109375, 0.46295166015625, 0.5069732666015625, 0.550994873046875, 0.5950164794921875, 0.6390380859375, 0.6830596923828125, 0.727081298828125, 0.7711029052734375, 0.81512451171875, 0.8591461181640625, 0.903167724609375, 0.9471893310546875, 0.9912109375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 24.0, 38.0, 180.0, 330.0, 287.0, 115.0, 28.0, 10.0], "bins": [-77.53179931640625, -76.23814392089844, -74.9444808959961, -73.65082550048828, -72.35717010498047, -71.06350708007812, -69.76985168457031, -68.4761962890625, -67.18254089355469, -65.88888549804688, -64.59522247314453, -63.30156707763672, -62.007911682128906, -60.71425247192383, -59.42059326171875, -58.12693786621094, -56.833274841308594, -55.539615631103516, -54.2459602355957, -52.952301025390625, -51.65864562988281, -50.364986419677734, -49.071327209472656, -47.777671813964844, -46.484012603759766, -45.19035339355469, -43.896697998046875, -42.6030387878418, -41.30937957763672, -40.015724182128906, -38.72206497192383, -37.42840576171875, -36.13474655151367, -34.841087341308594, -33.54743194580078, -32.2537727355957, -30.960115432739258, -29.666458129882812, -28.372798919677734, -27.07914161682129, -25.785486221313477, -24.49182891845703, -23.198169708251953, -21.904512405395508, -20.610855102539062, -19.317197799682617, -18.023540496826172, -16.729881286621094, -15.436223983764648, -14.142566680908203, -12.848908424377441, -11.55525016784668, -10.261592864990234, -8.967935562133789, -7.674277305603027, -6.380619049072266, -5.086961269378662, -3.7933034896850586, -2.499645709991455, -1.2059879302978516, 0.08766984939575195, 1.3813276290893555, 2.674985408782959, 3.9686436653137207, 5.262300968170166]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 12.0, 10.0, 10.0, 27.0, 17.0, 17.0, 24.0, 34.0, 37.0, 36.0, 38.0, 57.0, 54.0, 63.0, 62.0, 51.0, 77.0, 56.0, 53.0, 35.0, 43.0, 28.0, 34.0, 28.0, 27.0, 27.0, 16.0, 18.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.77413558959961, -13.325748443603516, -12.877361297607422, -12.428975105285645, -11.98058795928955, -11.532200813293457, -11.08381462097168, -10.635427474975586, -10.187040328979492, -9.738653182983398, -9.290266036987305, -8.841879844665527, -8.393492698669434, -7.94510555267334, -7.496718883514404, -7.048332214355469, -6.599945068359375, -6.151557922363281, -5.703171253204346, -5.25478458404541, -4.806397438049316, -4.358010292053223, -3.909623622894287, -3.4612367153167725, -3.012849807739258, -2.564462900161743, -2.1160759925842285, -1.6676890850067139, -1.2193021774291992, -0.7709152698516846, -0.3225283622741699, 0.12585854530334473, 0.5742454528808594, 1.022632360458374, 1.4710192680358887, 1.9194061756134033, 2.367793083190918, 2.8161799907684326, 3.2645668983459473, 3.712953805923462, 4.161340713500977, 4.60972785949707, 5.058114528656006, 5.506501197814941, 5.954888343811035, 6.403275489807129, 6.8516621589660645, 7.300048828125, 7.748435974121094, 8.196823120117188, 8.645210266113281, 9.093596458435059, 9.541983604431152, 9.990370750427246, 10.438756942749023, 10.887144088745117, 11.335531234741211, 11.783918380737305, 12.232305526733398, 12.680691719055176, 13.12907886505127, 13.577466011047363, 14.02585220336914, 14.474239349365234, 14.922626495361328]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 8.0, 5.0, 4.0, 10.0, 9.0, 8.0, 18.0, 49.0, 71.0, 132.0, 323.0, 866.0, 2506.0, 13404.0, 4098100.0, 70732.0, 5577.0, 1454.0, 538.0, 203.0, 102.0, 71.0, 24.0, 22.0, 17.0, 9.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 4.0], "bins": [-7.82421875, -7.653289794921875, -7.48236083984375, -7.311431884765625, -7.1405029296875, -6.969573974609375, -6.79864501953125, -6.627716064453125, -6.456787109375, -6.285858154296875, -6.11492919921875, -5.944000244140625, -5.7730712890625, -5.602142333984375, -5.43121337890625, -5.260284423828125, -5.08935546875, -4.918426513671875, -4.74749755859375, -4.576568603515625, -4.4056396484375, -4.234710693359375, -4.06378173828125, -3.892852783203125, -3.721923828125, -3.550994873046875, -3.38006591796875, -3.209136962890625, -3.0382080078125, -2.867279052734375, -2.69635009765625, -2.525421142578125, -2.3544921875, -2.183563232421875, -2.01263427734375, -1.841705322265625, -1.6707763671875, -1.499847412109375, -1.32891845703125, -1.157989501953125, -0.987060546875, -0.816131591796875, -0.64520263671875, -0.474273681640625, -0.3033447265625, -0.132415771484375, 0.03851318359375, 0.209442138671875, 0.38037109375, 0.551300048828125, 0.72222900390625, 0.893157958984375, 1.0640869140625, 1.235015869140625, 1.40594482421875, 1.576873779296875, 1.747802734375, 1.918731689453125, 2.08966064453125, 2.260589599609375, 2.4315185546875, 2.602447509765625, 2.77337646484375, 2.944305419921875, 3.115234375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 7.0, 8.0, 8.0, 8.0, 14.0, 14.0, 15.0, 13.0, 21.0, 24.0, 30.0, 45.0, 51.0, 30.0, 45.0, 49.0, 50.0, 51.0, 49.0, 46.0, 46.0, 51.0, 35.0, 41.0, 45.0, 33.0, 37.0, 26.0, 22.0, 9.0, 11.0, 15.0, 11.0, 11.0, 9.0, 1.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.60986328125, -0.5930099487304688, -0.5761566162109375, -0.5593032836914062, -0.542449951171875, -0.5255966186523438, -0.5087432861328125, -0.49188995361328125, -0.47503662109375, -0.45818328857421875, -0.4413299560546875, -0.42447662353515625, -0.407623291015625, -0.39076995849609375, -0.3739166259765625, -0.35706329345703125, -0.3402099609375, -0.32335662841796875, -0.3065032958984375, -0.28964996337890625, -0.272796630859375, -0.25594329833984375, -0.2390899658203125, -0.22223663330078125, -0.20538330078125, -0.18852996826171875, -0.1716766357421875, -0.15482330322265625, -0.137969970703125, -0.12111663818359375, -0.1042633056640625, -0.08740997314453125, -0.070556640625, -0.05370330810546875, -0.0368499755859375, -0.01999664306640625, -0.003143310546875, 0.01371002197265625, 0.0305633544921875, 0.04741668701171875, 0.06427001953125, 0.08112335205078125, 0.0979766845703125, 0.11483001708984375, 0.131683349609375, 0.14853668212890625, 0.1653900146484375, 0.18224334716796875, 0.1990966796875, 0.21595001220703125, 0.2328033447265625, 0.24965667724609375, 0.266510009765625, 0.28336334228515625, 0.3002166748046875, 0.31707000732421875, 0.33392333984375, 0.35077667236328125, 0.3676300048828125, 0.38448333740234375, 0.401336669921875, 0.41819000244140625, 0.4350433349609375, 0.45189666748046875, 0.46875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 7.0, 10.0, 14.0, 12.0, 21.0, 32.0, 46.0, 62.0, 95.0, 143.0, 228.0, 416.0, 706.0, 1391.0, 3121.0, 8290.0, 31716.0, 3795295.0, 316725.0, 23716.0, 6766.0, 2604.0, 1200.0, 657.0, 341.0, 213.0, 152.0, 94.0, 47.0, 39.0, 29.0, 19.0, 6.0, 10.0, 13.0, 6.0, 6.0, 5.0, 2.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.31640625, -3.221405029296875, -3.12640380859375, -3.031402587890625, -2.9364013671875, -2.841400146484375, -2.74639892578125, -2.651397705078125, -2.556396484375, -2.461395263671875, -2.36639404296875, -2.271392822265625, -2.1763916015625, -2.081390380859375, -1.98638916015625, -1.891387939453125, -1.79638671875, -1.701385498046875, -1.60638427734375, -1.511383056640625, -1.4163818359375, -1.321380615234375, -1.22637939453125, -1.131378173828125, -1.036376953125, -0.941375732421875, -0.84637451171875, -0.751373291015625, -0.6563720703125, -0.561370849609375, -0.46636962890625, -0.371368408203125, -0.2763671875, -0.181365966796875, -0.08636474609375, 0.008636474609375, 0.1036376953125, 0.198638916015625, 0.29364013671875, 0.388641357421875, 0.483642578125, 0.578643798828125, 0.67364501953125, 0.768646240234375, 0.8636474609375, 0.958648681640625, 1.05364990234375, 1.148651123046875, 1.24365234375, 1.338653564453125, 1.43365478515625, 1.528656005859375, 1.6236572265625, 1.718658447265625, 1.81365966796875, 1.908660888671875, 2.003662109375, 2.098663330078125, 2.19366455078125, 2.288665771484375, 2.3836669921875, 2.478668212890625, 2.57366943359375, 2.668670654296875, 2.763671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 10.0, 8.0, 6.0, 5.0, 21.0, 32.0, 54.0, 215.0, 3421.0, 179.0, 51.0, 22.0, 23.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.83251953125, -0.8113784790039062, -0.7902374267578125, -0.7690963745117188, -0.747955322265625, -0.7268142700195312, -0.7056732177734375, -0.6845321655273438, -0.66339111328125, -0.6422500610351562, -0.6211090087890625, -0.5999679565429688, -0.578826904296875, -0.5576858520507812, -0.5365447998046875, -0.5154037475585938, -0.4942626953125, -0.47312164306640625, -0.4519805908203125, -0.43083953857421875, -0.409698486328125, -0.38855743408203125, -0.3674163818359375, -0.34627532958984375, -0.32513427734375, -0.30399322509765625, -0.2828521728515625, -0.26171112060546875, -0.240570068359375, -0.21942901611328125, -0.1982879638671875, -0.17714691162109375, -0.156005859375, -0.13486480712890625, -0.1137237548828125, -0.09258270263671875, -0.071441650390625, -0.05030059814453125, -0.0291595458984375, -0.00801849365234375, 0.01312255859375, 0.03426361083984375, 0.0554046630859375, 0.07654571533203125, 0.097686767578125, 0.11882781982421875, 0.1399688720703125, 0.16110992431640625, 0.1822509765625, 0.20339202880859375, 0.2245330810546875, 0.24567413330078125, 0.266815185546875, 0.28795623779296875, 0.3090972900390625, 0.33023834228515625, 0.35137939453125, 0.37252044677734375, 0.3936614990234375, 0.41480255126953125, 0.435943603515625, 0.45708465576171875, 0.4782257080078125, 0.49936676025390625, 0.5205078125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 3.0, 4.0, 6.0, 14.0, 28.0, 40.0, 60.0, 120.0, 147.0, 166.0, 134.0, 124.0, 76.0, 40.0, 22.0, 11.0, 3.0, 6.0, 6.0, 2.0, 2.0], "bins": [-4.905620574951172, -4.812600135803223, -4.719579696655273, -4.626559257507324, -4.533538341522217, -4.440517902374268, -4.347497463226318, -4.254477024078369, -4.16145658493042, -4.068436145782471, -3.9754154682159424, -3.882395029067993, -3.789374589920044, -3.6963541507720947, -3.6033334732055664, -3.510313034057617, -3.417292594909668, -3.3242721557617188, -3.2312514781951904, -3.138231039047241, -3.045210599899292, -2.9521901607513428, -2.8591694831848145, -2.7661490440368652, -2.673128366470337, -2.5801079273223877, -2.4870872497558594, -2.39406681060791, -2.301046371459961, -2.2080259323120117, -2.1150052547454834, -2.021984815597534, -1.928964376449585, -1.8359438180923462, -1.742923378944397, -1.6499028205871582, -1.556882381439209, -1.4638618230819702, -1.3708412647247314, -1.2778208255767822, -1.184800386428833, -1.0917798280715942, -0.998759388923645, -0.9057388305664062, -0.812718391418457, -0.7196978330612183, -0.6266773343086243, -0.5336568355560303, -0.4406362771987915, -0.3476157784461975, -0.2545952796936035, -0.16157475113868713, -0.06855425238609314, 0.024466246366500854, 0.11748677492141724, 0.21050727367401123, 0.3035277724266052, 0.3965482711791992, 0.4895687699317932, 0.5825892686843872, 0.675609827041626, 0.7686302661895752, 0.861650824546814, 0.954671323299408, 1.047691822052002]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 6.0, 8.0, 20.0, 10.0, 10.0, 9.0, 16.0, 23.0, 26.0, 32.0, 34.0, 29.0, 46.0, 40.0, 35.0, 34.0, 61.0, 46.0, 56.0, 40.0, 38.0, 49.0, 43.0, 30.0, 36.0, 31.0, 31.0, 23.0, 18.0, 18.0, 23.0, 18.0, 7.0, 9.0, 7.0, 5.0, 12.0, 5.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.1453073024749756, -1.1123360395431519, -1.0793648958206177, -1.046393632888794, -1.0134224891662598, -0.980451226234436, -0.9474800229072571, -0.9145088195800781, -0.8815376162528992, -0.8485664129257202, -0.8155952095985413, -0.7826240062713623, -0.7496527433395386, -0.7166815996170044, -0.6837103366851807, -0.6507391333580017, -0.6177679300308228, -0.5847967267036438, -0.5518255233764648, -0.5188543200492859, -0.48588308691978455, -0.4529118835926056, -0.41994065046310425, -0.3869694471359253, -0.35399824380874634, -0.3210270404815674, -0.2880558371543884, -0.2550846040248871, -0.22211340069770813, -0.18914219737052917, -0.15617097914218903, -0.12319976091384888, -0.09022867679595947, -0.05725746601819992, -0.02428625524044037, 0.008684955537319183, 0.041656166315078735, 0.07462736964225769, 0.10759858787059784, 0.140569806098938, 0.17354100942611694, 0.2065122127532959, 0.23948343098163605, 0.2724546492099762, 0.30542585253715515, 0.3383970558643341, 0.37136828899383545, 0.4043394923210144, 0.43731069564819336, 0.4702818989753723, 0.5032531023025513, 0.5362243056297302, 0.5691955089569092, 0.6021667718887329, 0.6351379752159119, 0.6681091785430908, 0.7010803818702698, 0.7340515851974487, 0.7670227885246277, 0.7999939918518066, 0.8329652547836304, 0.8659363985061646, 0.8989076614379883, 0.9318788647651672, 0.9648500680923462]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 6.0, 7.0, 10.0, 24.0, 23.0, 36.0, 52.0, 84.0, 195.0, 436.0, 970.0, 2413.0, 6829.0, 22070.0, 78555.0, 269174.0, 419266.0, 177908.0, 48562.0, 14148.0, 4646.0, 1737.0, 703.0, 333.0, 141.0, 89.0, 47.0, 29.0, 12.0, 13.0, 7.0, 7.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.509765625, -2.42962646484375, -2.3494873046875, -2.26934814453125, -2.189208984375, -2.10906982421875, -2.0289306640625, -1.94879150390625, -1.86865234375, -1.78851318359375, -1.7083740234375, -1.62823486328125, -1.548095703125, -1.46795654296875, -1.3878173828125, -1.30767822265625, -1.2275390625, -1.14739990234375, -1.0672607421875, -0.98712158203125, -0.906982421875, -0.82684326171875, -0.7467041015625, -0.66656494140625, -0.58642578125, -0.50628662109375, -0.4261474609375, -0.34600830078125, -0.265869140625, -0.18572998046875, -0.1055908203125, -0.02545166015625, 0.0546875, 0.13482666015625, 0.2149658203125, 0.29510498046875, 0.375244140625, 0.45538330078125, 0.5355224609375, 0.61566162109375, 0.69580078125, 0.77593994140625, 0.8560791015625, 0.93621826171875, 1.016357421875, 1.09649658203125, 1.1766357421875, 1.25677490234375, 1.3369140625, 1.41705322265625, 1.4971923828125, 1.57733154296875, 1.657470703125, 1.73760986328125, 1.8177490234375, 1.89788818359375, 1.97802734375, 2.05816650390625, 2.1383056640625, 2.21844482421875, 2.298583984375, 2.37872314453125, 2.4588623046875, 2.53900146484375, 2.619140625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 6.0, 5.0, 5.0, 9.0, 5.0, 19.0, 9.0, 17.0, 20.0, 19.0, 34.0, 29.0, 26.0, 44.0, 35.0, 44.0, 49.0, 48.0, 43.0, 46.0, 37.0, 45.0, 49.0, 40.0, 40.0, 38.0, 41.0, 29.0, 33.0, 30.0, 22.0, 14.0, 16.0, 13.0, 13.0, 10.0, 6.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6240234375, -0.6060409545898438, -0.5880584716796875, -0.5700759887695312, -0.552093505859375, -0.5341110229492188, -0.5161285400390625, -0.49814605712890625, -0.48016357421875, -0.46218109130859375, -0.4441986083984375, -0.42621612548828125, -0.408233642578125, -0.39025115966796875, -0.3722686767578125, -0.35428619384765625, -0.3363037109375, -0.31832122802734375, -0.3003387451171875, -0.28235626220703125, -0.264373779296875, -0.24639129638671875, -0.2284088134765625, -0.21042633056640625, -0.19244384765625, -0.17446136474609375, -0.1564788818359375, -0.13849639892578125, -0.120513916015625, -0.10253143310546875, -0.0845489501953125, -0.06656646728515625, -0.048583984375, -0.03060150146484375, -0.0126190185546875, 0.00536346435546875, 0.023345947265625, 0.04132843017578125, 0.0593109130859375, 0.07729339599609375, 0.09527587890625, 0.11325836181640625, 0.1312408447265625, 0.14922332763671875, 0.167205810546875, 0.18518829345703125, 0.2031707763671875, 0.22115325927734375, 0.2391357421875, 0.25711822509765625, 0.2751007080078125, 0.29308319091796875, 0.311065673828125, 0.32904815673828125, 0.3470306396484375, 0.36501312255859375, 0.38299560546875, 0.40097808837890625, 0.4189605712890625, 0.43694305419921875, 0.454925537109375, 0.47290802001953125, 0.4908905029296875, 0.5088729858398438, 0.52685546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 8.0, 13.0, 13.0, 34.0, 27.0, 67.0, 76.0, 158.0, 203.0, 385.0, 765.0, 1376.0, 2657.0, 5655.0, 12495.0, 29933.0, 76586.0, 199486.0, 374617.0, 208500.0, 79083.0, 31016.0, 13309.0, 5953.0, 2829.0, 1446.0, 758.0, 435.0, 246.0, 167.0, 94.0, 42.0, 35.0, 22.0, 13.0, 13.0, 15.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.64453125, -1.5923614501953125, -1.540191650390625, -1.4880218505859375, -1.43585205078125, -1.3836822509765625, -1.331512451171875, -1.2793426513671875, -1.2271728515625, -1.1750030517578125, -1.122833251953125, -1.0706634521484375, -1.01849365234375, -0.9663238525390625, -0.914154052734375, -0.8619842529296875, -0.809814453125, -0.7576446533203125, -0.705474853515625, -0.6533050537109375, -0.60113525390625, -0.5489654541015625, -0.496795654296875, -0.4446258544921875, -0.3924560546875, -0.3402862548828125, -0.288116455078125, -0.2359466552734375, -0.18377685546875, -0.1316070556640625, -0.079437255859375, -0.0272674560546875, 0.02490234375, 0.0770721435546875, 0.129241943359375, 0.1814117431640625, 0.23358154296875, 0.2857513427734375, 0.337921142578125, 0.3900909423828125, 0.4422607421875, 0.4944305419921875, 0.546600341796875, 0.5987701416015625, 0.65093994140625, 0.7031097412109375, 0.755279541015625, 0.8074493408203125, 0.859619140625, 0.9117889404296875, 0.963958740234375, 1.0161285400390625, 1.06829833984375, 1.1204681396484375, 1.172637939453125, 1.2248077392578125, 1.2769775390625, 1.3291473388671875, 1.381317138671875, 1.4334869384765625, 1.48565673828125, 1.5378265380859375, 1.589996337890625, 1.6421661376953125, 1.6943359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 10.0, 10.0, 15.0, 28.0, 21.0, 22.0, 21.0, 49.0, 34.0, 37.0, 58.0, 49.0, 56.0, 63.0, 51.0, 65.0, 54.0, 46.0, 42.0, 43.0, 38.0, 32.0, 24.0, 22.0, 23.0, 15.0, 8.0, 11.0, 13.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.173828125, -3.056732177734375, -2.93963623046875, -2.822540283203125, -2.7054443359375, -2.588348388671875, -2.47125244140625, -2.354156494140625, -2.237060546875, -2.119964599609375, -2.00286865234375, -1.885772705078125, -1.7686767578125, -1.651580810546875, -1.53448486328125, -1.417388916015625, -1.30029296875, -1.183197021484375, -1.06610107421875, -0.949005126953125, -0.8319091796875, -0.714813232421875, -0.59771728515625, -0.480621337890625, -0.363525390625, -0.246429443359375, -0.12933349609375, -0.012237548828125, 0.1048583984375, 0.221954345703125, 0.33905029296875, 0.456146240234375, 0.5732421875, 0.690338134765625, 0.80743408203125, 0.924530029296875, 1.0416259765625, 1.158721923828125, 1.27581787109375, 1.392913818359375, 1.510009765625, 1.627105712890625, 1.74420166015625, 1.861297607421875, 1.9783935546875, 2.095489501953125, 2.21258544921875, 2.329681396484375, 2.44677734375, 2.563873291015625, 2.68096923828125, 2.798065185546875, 2.9151611328125, 3.032257080078125, 3.14935302734375, 3.266448974609375, 3.383544921875, 3.500640869140625, 3.61773681640625, 3.734832763671875, 3.8519287109375, 3.969024658203125, 4.08612060546875, 4.203216552734375, 4.3203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 9.0, 17.0, 31.0, 53.0, 87.0, 172.0, 412.0, 1173.0, 6321.0, 199505.0, 825101.0, 12858.0, 1851.0, 494.0, 213.0, 95.0, 57.0, 48.0, 16.0, 6.0, 13.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.5078125, -4.36761474609375, -4.2274169921875, -4.08721923828125, -3.947021484375, -3.80682373046875, -3.6666259765625, -3.52642822265625, -3.38623046875, -3.24603271484375, -3.1058349609375, -2.96563720703125, -2.825439453125, -2.68524169921875, -2.5450439453125, -2.40484619140625, -2.2646484375, -2.12445068359375, -1.9842529296875, -1.84405517578125, -1.703857421875, -1.56365966796875, -1.4234619140625, -1.28326416015625, -1.14306640625, -1.00286865234375, -0.8626708984375, -0.72247314453125, -0.582275390625, -0.44207763671875, -0.3018798828125, -0.16168212890625, -0.021484375, 0.11871337890625, 0.2589111328125, 0.39910888671875, 0.539306640625, 0.67950439453125, 0.8197021484375, 0.95989990234375, 1.10009765625, 1.24029541015625, 1.3804931640625, 1.52069091796875, 1.660888671875, 1.80108642578125, 1.9412841796875, 2.08148193359375, 2.2216796875, 2.36187744140625, 2.5020751953125, 2.64227294921875, 2.782470703125, 2.92266845703125, 3.0628662109375, 3.20306396484375, 3.34326171875, 3.48345947265625, 3.6236572265625, 3.76385498046875, 3.904052734375, 4.04425048828125, 4.1844482421875, 4.32464599609375, 4.46484375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 16.0, 27.0, 25.0, 43.0, 58.0, 83.0, 91.0, 136.0, 119.0, 100.0, 104.0, 66.0, 29.0, 30.0, 24.0, 16.0, 8.0, 8.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014734268188476562, -0.00013963505625724792, -0.00013192743062973022, -0.00012421980500221252, -0.00011651217937469482, -0.00010880455374717712, -0.00010109692811965942, -9.338930249214172e-05, -8.568167686462402e-05, -7.797405123710632e-05, -7.026642560958862e-05, -6.255879998207092e-05, -5.485117435455322e-05, -4.714354872703552e-05, -3.943592309951782e-05, -3.172829747200012e-05, -2.4020671844482422e-05, -1.631304621696472e-05, -8.605420589447021e-06, -8.977949619293213e-07, 6.809830665588379e-06, 1.4517456293106079e-05, 2.222508192062378e-05, 2.993270754814148e-05, 3.764033317565918e-05, 4.534795880317688e-05, 5.305558443069458e-05, 6.076321005821228e-05, 6.847083568572998e-05, 7.617846131324768e-05, 8.388608694076538e-05, 9.159371256828308e-05, 9.930133819580078e-05, 0.00010700896382331848, 0.00011471658945083618, 0.00012242421507835388, 0.00013013184070587158, 0.00013783946633338928, 0.00014554709196090698, 0.00015325471758842468, 0.00016096234321594238, 0.00016866996884346008, 0.00017637759447097778, 0.00018408522009849548, 0.00019179284572601318, 0.00019950047135353088, 0.00020720809698104858, 0.00021491572260856628, 0.00022262334823608398, 0.00023033097386360168, 0.00023803859949111938, 0.0002457462251186371, 0.0002534538507461548, 0.0002611614763736725, 0.0002688691020011902, 0.0002765767276287079, 0.0002842843532562256, 0.0002919919788837433, 0.000299699604511261, 0.0003074072301387787, 0.0003151148557662964, 0.0003228224813938141, 0.0003305301070213318, 0.0003382377326488495, 0.0003459453582763672]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 9.0, 10.0, 27.0, 41.0, 91.0, 221.0, 678.0, 2332.0, 12879.0, 325334.0, 681136.0, 21214.0, 3222.0, 845.0, 294.0, 102.0, 62.0, 24.0, 9.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.416015625, -3.31585693359375, -3.2156982421875, -3.11553955078125, -3.015380859375, -2.91522216796875, -2.8150634765625, -2.71490478515625, -2.61474609375, -2.51458740234375, -2.4144287109375, -2.31427001953125, -2.214111328125, -2.11395263671875, -2.0137939453125, -1.91363525390625, -1.8134765625, -1.71331787109375, -1.6131591796875, -1.51300048828125, -1.412841796875, -1.31268310546875, -1.2125244140625, -1.11236572265625, -1.01220703125, -0.91204833984375, -0.8118896484375, -0.71173095703125, -0.611572265625, -0.51141357421875, -0.4112548828125, -0.31109619140625, -0.2109375, -0.11077880859375, -0.0106201171875, 0.08953857421875, 0.189697265625, 0.28985595703125, 0.3900146484375, 0.49017333984375, 0.59033203125, 0.69049072265625, 0.7906494140625, 0.89080810546875, 0.990966796875, 1.09112548828125, 1.1912841796875, 1.29144287109375, 1.3916015625, 1.49176025390625, 1.5919189453125, 1.69207763671875, 1.792236328125, 1.89239501953125, 1.9925537109375, 2.09271240234375, 2.19287109375, 2.29302978515625, 2.3931884765625, 2.49334716796875, 2.593505859375, 2.69366455078125, 2.7938232421875, 2.89398193359375, 2.994140625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 4.0, 10.0, 6.0, 9.0, 20.0, 32.0, 85.0, 142.0, 204.0, 230.0, 118.0, 61.0, 31.0, 18.0, 7.0, 7.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.546875, -4.42962646484375, -4.3123779296875, -4.19512939453125, -4.077880859375, -3.96063232421875, -3.8433837890625, -3.72613525390625, -3.60888671875, -3.49163818359375, -3.3743896484375, -3.25714111328125, -3.139892578125, -3.02264404296875, -2.9053955078125, -2.78814697265625, -2.6708984375, -2.55364990234375, -2.4364013671875, -2.31915283203125, -2.201904296875, -2.08465576171875, -1.9674072265625, -1.85015869140625, -1.73291015625, -1.61566162109375, -1.4984130859375, -1.38116455078125, -1.263916015625, -1.14666748046875, -1.0294189453125, -0.91217041015625, -0.794921875, -0.67767333984375, -0.5604248046875, -0.44317626953125, -0.325927734375, -0.20867919921875, -0.0914306640625, 0.02581787109375, 0.14306640625, 0.26031494140625, 0.3775634765625, 0.49481201171875, 0.612060546875, 0.72930908203125, 0.8465576171875, 0.96380615234375, 1.0810546875, 1.19830322265625, 1.3155517578125, 1.43280029296875, 1.550048828125, 1.66729736328125, 1.7845458984375, 1.90179443359375, 2.01904296875, 2.13629150390625, 2.2535400390625, 2.37078857421875, 2.488037109375, 2.60528564453125, 2.7225341796875, 2.83978271484375, 2.95703125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 14.0, 28.0, 74.0, 170.0, 270.0, 231.0, 144.0, 60.0, 12.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.5616569519043, -31.949108123779297, -30.336559295654297, -28.724008560180664, -27.111459732055664, -25.498910903930664, -23.88636016845703, -22.27381134033203, -20.66126251220703, -19.04871368408203, -17.43616485595703, -15.823614120483398, -14.211065292358398, -12.598516464233398, -10.985966682434082, -9.373416900634766, -7.760868072509766, -6.148318767547607, -4.535769462585449, -2.923220157623291, -1.3106708526611328, 0.3018779754638672, 1.9144277572631836, 3.5269775390625, 5.1395263671875, 6.752075672149658, 8.364624977111816, 9.977174758911133, 11.589723587036133, 13.202272415161133, 14.81482219696045, 16.427371978759766, 18.03992462158203, 19.65247344970703, 21.26502227783203, 22.877573013305664, 24.490121841430664, 26.102670669555664, 27.715221405029297, 29.327770233154297, 30.940319061279297, 32.5528678894043, 34.1654167175293, 35.7779655456543, 37.39051818847656, 39.00306701660156, 40.61561584472656, 42.22816467285156, 43.84071350097656, 45.45326232910156, 47.06581115722656, 48.67835998535156, 50.29090881347656, 51.90345764160156, 53.51601028442383, 55.12855911254883, 56.74110794067383, 58.35365676879883, 59.96620559692383, 61.57875442504883, 63.191307067871094, 64.8038558959961, 66.4164047241211, 68.0289535522461, 69.6415023803711]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 0.0, 10.0, 9.0, 7.0, 10.0, 11.0, 17.0, 15.0, 19.0, 27.0, 25.0, 17.0, 27.0, 33.0, 44.0, 52.0, 44.0, 47.0, 39.0, 48.0, 60.0, 47.0, 57.0, 43.0, 29.0, 39.0, 28.0, 22.0, 24.0, 18.0, 21.0, 28.0, 18.0, 6.0, 12.0, 10.0, 7.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-17.513343811035156, -16.96009635925293, -16.40684700012207, -15.853599548339844, -15.300352096557617, -14.747103691101074, -14.193855285644531, -13.640607833862305, -13.087359428405762, -12.534111022949219, -11.980863571166992, -11.42761516571045, -10.874366760253906, -10.32111930847168, -9.767870903015137, -9.214622497558594, -8.661375045776367, -8.108126640319824, -7.554879188537598, -7.001630783081055, -6.44838285446167, -5.895134925842285, -5.341886520385742, -4.788638591766357, -4.235390663146973, -3.682142734527588, -3.128894567489624, -2.57564640045166, -2.0223984718322754, -1.4691505432128906, -0.9159023761749268, -0.3626542091369629, 0.19059371948242188, 0.7438417673110962, 1.2970898151397705, 1.8503378629684448, 2.403585910797119, 2.956833839416504, 3.5100820064544678, 4.063330173492432, 4.616578102111816, 5.169826030731201, 5.723073959350586, 6.276322364807129, 6.829570293426514, 7.382818222045898, 7.936066627502441, 8.489315032958984, 9.042562484741211, 9.595810890197754, 10.14905834197998, 10.702306747436523, 11.25555419921875, 11.808802604675293, 12.362051010131836, 12.915298461914062, 13.468546867370605, 14.021795272827148, 14.575042724609375, 15.128291130065918, 15.681539535522461, 16.234786987304688, 16.788034439086914, 17.341283798217773, 17.89453125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 15.0, 17.0, 36.0, 69.0, 151.0, 405.0, 1382.0, 7261.0, 4007031.0, 170849.0, 5407.0, 1052.0, 340.0, 128.0, 53.0, 34.0, 14.0, 8.0, 10.0, 1.0, 8.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.453125, -13.1536865234375, -12.854248046875, -12.5548095703125, -12.25537109375, -11.9559326171875, -11.656494140625, -11.3570556640625, -11.0576171875, -10.7581787109375, -10.458740234375, -10.1593017578125, -9.85986328125, -9.5604248046875, -9.260986328125, -8.9615478515625, -8.662109375, -8.3626708984375, -8.063232421875, -7.7637939453125, -7.46435546875, -7.1649169921875, -6.865478515625, -6.5660400390625, -6.2666015625, -5.9671630859375, -5.667724609375, -5.3682861328125, -5.06884765625, -4.7694091796875, -4.469970703125, -4.1705322265625, -3.87109375, -3.5716552734375, -3.272216796875, -2.9727783203125, -2.67333984375, -2.3739013671875, -2.074462890625, -1.7750244140625, -1.4755859375, -1.1761474609375, -0.876708984375, -0.5772705078125, -0.27783203125, 0.0216064453125, 0.321044921875, 0.6204833984375, 0.919921875, 1.2193603515625, 1.518798828125, 1.8182373046875, 2.11767578125, 2.4171142578125, 2.716552734375, 3.0159912109375, 3.3154296875, 3.6148681640625, 3.914306640625, 4.2137451171875, 4.51318359375, 4.8126220703125, 5.112060546875, 5.4114990234375, 5.7109375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 1.0, 4.0, 6.0, 9.0, 4.0, 7.0, 14.0, 23.0, 22.0, 27.0, 36.0, 31.0, 32.0, 57.0, 54.0, 42.0, 45.0, 56.0, 46.0, 53.0, 60.0, 54.0, 43.0, 43.0, 48.0, 33.0, 25.0, 22.0, 20.0, 11.0, 13.0, 8.0, 12.0, 7.0, 9.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.87548828125, -0.849853515625, -0.82421875, -0.798583984375, -0.77294921875, -0.747314453125, -0.7216796875, -0.696044921875, -0.67041015625, -0.644775390625, -0.619140625, -0.593505859375, -0.56787109375, -0.542236328125, -0.5166015625, -0.490966796875, -0.46533203125, -0.439697265625, -0.4140625, -0.388427734375, -0.36279296875, -0.337158203125, -0.3115234375, -0.285888671875, -0.26025390625, -0.234619140625, -0.208984375, -0.183349609375, -0.15771484375, -0.132080078125, -0.1064453125, -0.080810546875, -0.05517578125, -0.029541015625, -0.00390625, 0.021728515625, 0.04736328125, 0.072998046875, 0.0986328125, 0.124267578125, 0.14990234375, 0.175537109375, 0.201171875, 0.226806640625, 0.25244140625, 0.278076171875, 0.3037109375, 0.329345703125, 0.35498046875, 0.380615234375, 0.40625, 0.431884765625, 0.45751953125, 0.483154296875, 0.5087890625, 0.534423828125, 0.56005859375, 0.585693359375, 0.611328125, 0.636962890625, 0.66259765625, 0.688232421875, 0.7138671875, 0.739501953125, 0.76513671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 8.0, 10.0, 23.0, 19.0, 35.0, 53.0, 71.0, 99.0, 155.0, 220.0, 320.0, 536.0, 815.0, 1297.0, 2004.0, 3446.0, 6132.0, 12130.0, 32057.0, 140761.0, 3827171.0, 112899.0, 28401.0, 11456.0, 5677.0, 3157.0, 1838.0, 1246.0, 725.0, 506.0, 306.0, 203.0, 143.0, 114.0, 74.0, 56.0, 34.0, 32.0, 18.0, 9.0, 4.0, 10.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.46875, -2.387664794921875, -2.30657958984375, -2.225494384765625, -2.1444091796875, -2.063323974609375, -1.98223876953125, -1.901153564453125, -1.820068359375, -1.738983154296875, -1.65789794921875, -1.576812744140625, -1.4957275390625, -1.414642333984375, -1.33355712890625, -1.252471923828125, -1.17138671875, -1.090301513671875, -1.00921630859375, -0.928131103515625, -0.8470458984375, -0.765960693359375, -0.68487548828125, -0.603790283203125, -0.522705078125, -0.441619873046875, -0.36053466796875, -0.279449462890625, -0.1983642578125, -0.117279052734375, -0.03619384765625, 0.044891357421875, 0.1259765625, 0.207061767578125, 0.28814697265625, 0.369232177734375, 0.4503173828125, 0.531402587890625, 0.61248779296875, 0.693572998046875, 0.774658203125, 0.855743408203125, 0.93682861328125, 1.017913818359375, 1.0989990234375, 1.180084228515625, 1.26116943359375, 1.342254638671875, 1.42333984375, 1.504425048828125, 1.58551025390625, 1.666595458984375, 1.7476806640625, 1.828765869140625, 1.90985107421875, 1.990936279296875, 2.072021484375, 2.153106689453125, 2.23419189453125, 2.315277099609375, 2.3963623046875, 2.477447509765625, 2.55853271484375, 2.639617919921875, 2.720703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 5.0, 7.0, 10.0, 11.0, 11.0, 16.0, 18.0, 37.0, 56.0, 156.0, 2979.0, 487.0, 105.0, 56.0, 34.0, 31.0, 15.0, 4.0, 8.0, 2.0, 7.0, 7.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.984375, -0.9576873779296875, -0.930999755859375, -0.9043121337890625, -0.87762451171875, -0.8509368896484375, -0.824249267578125, -0.7975616455078125, -0.7708740234375, -0.7441864013671875, -0.717498779296875, -0.6908111572265625, -0.66412353515625, -0.6374359130859375, -0.610748291015625, -0.5840606689453125, -0.557373046875, -0.5306854248046875, -0.503997802734375, -0.4773101806640625, -0.45062255859375, -0.4239349365234375, -0.397247314453125, -0.3705596923828125, -0.3438720703125, -0.3171844482421875, -0.290496826171875, -0.2638092041015625, -0.23712158203125, -0.2104339599609375, -0.183746337890625, -0.1570587158203125, -0.13037109375, -0.1036834716796875, -0.076995849609375, -0.0503082275390625, -0.02362060546875, 0.0030670166015625, 0.029754638671875, 0.0564422607421875, 0.0831298828125, 0.1098175048828125, 0.136505126953125, 0.1631927490234375, 0.18988037109375, 0.2165679931640625, 0.243255615234375, 0.2699432373046875, 0.296630859375, 0.3233184814453125, 0.350006103515625, 0.3766937255859375, 0.40338134765625, 0.4300689697265625, 0.456756591796875, 0.4834442138671875, 0.5101318359375, 0.5368194580078125, 0.563507080078125, 0.5901947021484375, 0.61688232421875, 0.6435699462890625, 0.670257568359375, 0.6969451904296875, 0.7236328125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 11.0, 17.0, 29.0, 39.0, 64.0, 102.0, 127.0, 147.0, 131.0, 107.0, 69.0, 60.0, 36.0, 36.0, 12.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.696760654449463, -6.558041572570801, -6.419322490692139, -6.280602931976318, -6.141883850097656, -6.003164768218994, -5.864445686340332, -5.72572660446167, -5.587007522583008, -5.448288440704346, -5.309569358825684, -5.170849800109863, -5.032130718231201, -4.893411636352539, -4.754692554473877, -4.615973472595215, -4.4772539138793945, -4.338534832000732, -4.19981575012207, -4.06109619140625, -3.922377109527588, -3.783658027648926, -3.6449389457702637, -3.5062198638916016, -3.3675005435943604, -3.2287814617156982, -3.090062141418457, -2.951343059539795, -2.812623977661133, -2.6739046573638916, -2.5351855754852295, -2.3964662551879883, -2.2577476501464844, -2.1190285682678223, -1.980309247970581, -1.841590166091919, -1.7028709650039673, -1.5641517639160156, -1.4254326820373535, -1.2867134809494019, -1.1479942798614502, -1.0092750787734985, -0.8705559372901917, -0.7318367958068848, -0.5931175947189331, -0.45439839363098145, -0.31567925214767456, -0.17696011066436768, -0.038240909576416016, 0.10047826170921326, 0.23919743299484253, 0.3779166042804718, 0.5166357755661011, 0.6553549766540527, 0.7940741181373596, 0.9327932596206665, 1.0715124607086182, 1.2102316617965698, 1.3489508628845215, 1.4876699447631836, 1.6263891458511353, 1.765108346939087, 1.903827428817749, 2.0425467491149902, 2.1812658309936523]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 11.0, 13.0, 12.0, 15.0, 21.0, 17.0, 25.0, 24.0, 34.0, 23.0, 38.0, 34.0, 48.0, 47.0, 49.0, 47.0, 55.0, 40.0, 47.0, 55.0, 41.0, 39.0, 39.0, 44.0, 22.0, 23.0, 23.0, 13.0, 15.0, 15.0, 14.0, 20.0, 11.0, 3.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8557887077331543, -1.7828123569488525, -1.7098360061645508, -1.636859655380249, -1.5638831853866577, -1.490906834602356, -1.4179304838180542, -1.344954013824463, -1.2719776630401611, -1.1990013122558594, -1.1260249614715576, -1.0530486106872559, -0.9800721406936646, -0.9070957899093628, -0.834119439125061, -0.7611430287361145, -0.6881667375564575, -0.6151903867721558, -0.5422139763832092, -0.46923762559890747, -0.3962612450122833, -0.3232848644256592, -0.2503085136413574, -0.1773321032524109, -0.10435575246810913, -0.03137937933206558, 0.041596993803977966, 0.11457335948944092, 0.18754974007606506, 0.2605261206626892, 0.33350247144699097, 0.4064788818359375, 0.47945523262023926, 0.552431583404541, 0.6254079937934875, 0.6983843445777893, 0.7713607549667358, 0.8443371057510376, 0.9173134565353394, 0.9902898669242859, 1.0632662773132324, 1.1362426280975342, 1.209218978881836, 1.2821953296661377, 1.355171799659729, 1.4281481504440308, 1.5011245012283325, 1.5741009712219238, 1.647077202796936, 1.7200535535812378, 1.7930299043655396, 1.8660063743591309, 1.9389827251434326, 2.0119590759277344, 2.084935426712036, 2.157911777496338, 2.2308881282806396, 2.3038644790649414, 2.376840829849243, 2.449817180633545, 2.5227935314178467, 2.5957698822021484, 2.6687464714050293, 2.741722822189331, 2.814699172973633]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 4.0, 17.0, 12.0, 17.0, 22.0, 25.0, 58.0, 146.0, 256.0, 681.0, 1589.0, 4692.0, 15615.0, 61018.0, 257586.0, 470802.0, 177988.0, 41372.0, 10917.0, 3424.0, 1258.0, 582.0, 236.0, 96.0, 62.0, 34.0, 10.0, 14.0, 9.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.751953125, -2.658233642578125, -2.56451416015625, -2.470794677734375, -2.3770751953125, -2.283355712890625, -2.18963623046875, -2.095916748046875, -2.002197265625, -1.908477783203125, -1.81475830078125, -1.721038818359375, -1.6273193359375, -1.533599853515625, -1.43988037109375, -1.346160888671875, -1.25244140625, -1.158721923828125, -1.06500244140625, -0.971282958984375, -0.8775634765625, -0.783843994140625, -0.69012451171875, -0.596405029296875, -0.502685546875, -0.408966064453125, -0.31524658203125, -0.221527099609375, -0.1278076171875, -0.034088134765625, 0.05963134765625, 0.153350830078125, 0.2470703125, 0.340789794921875, 0.43450927734375, 0.528228759765625, 0.6219482421875, 0.715667724609375, 0.80938720703125, 0.903106689453125, 0.996826171875, 1.090545654296875, 1.18426513671875, 1.277984619140625, 1.3717041015625, 1.465423583984375, 1.55914306640625, 1.652862548828125, 1.74658203125, 1.840301513671875, 1.93402099609375, 2.027740478515625, 2.1214599609375, 2.215179443359375, 2.30889892578125, 2.402618408203125, 2.496337890625, 2.590057373046875, 2.68377685546875, 2.777496337890625, 2.8712158203125, 2.964935302734375, 3.05865478515625, 3.152374267578125, 3.24609375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 10.0, 11.0, 9.0, 11.0, 11.0, 22.0, 20.0, 26.0, 34.0, 42.0, 26.0, 49.0, 47.0, 56.0, 53.0, 51.0, 48.0, 38.0, 61.0, 61.0, 44.0, 50.0, 36.0, 36.0, 36.0, 27.0, 13.0, 7.0, 10.0, 13.0, 7.0, 10.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.95166015625, -0.924560546875, -0.8974609375, -0.870361328125, -0.84326171875, -0.816162109375, -0.7890625, -0.761962890625, -0.73486328125, -0.707763671875, -0.6806640625, -0.653564453125, -0.62646484375, -0.599365234375, -0.572265625, -0.545166015625, -0.51806640625, -0.490966796875, -0.4638671875, -0.436767578125, -0.40966796875, -0.382568359375, -0.35546875, -0.328369140625, -0.30126953125, -0.274169921875, -0.2470703125, -0.219970703125, -0.19287109375, -0.165771484375, -0.138671875, -0.111572265625, -0.08447265625, -0.057373046875, -0.0302734375, -0.003173828125, 0.02392578125, 0.051025390625, 0.078125, 0.105224609375, 0.13232421875, 0.159423828125, 0.1865234375, 0.213623046875, 0.24072265625, 0.267822265625, 0.294921875, 0.322021484375, 0.34912109375, 0.376220703125, 0.4033203125, 0.430419921875, 0.45751953125, 0.484619140625, 0.51171875, 0.538818359375, 0.56591796875, 0.593017578125, 0.6201171875, 0.647216796875, 0.67431640625, 0.701416015625, 0.728515625, 0.755615234375, 0.78271484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 15.0, 23.0, 20.0, 59.0, 86.0, 168.0, 326.0, 798.0, 2198.0, 7265.0, 33364.0, 225980.0, 622885.0, 126617.0, 20822.0, 5080.0, 1557.0, 636.0, 266.0, 158.0, 78.0, 40.0, 31.0, 13.0, 8.0, 10.0, 14.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.103546142578125, -3.98052978515625, -3.857513427734375, -3.7344970703125, -3.611480712890625, -3.48846435546875, -3.365447998046875, -3.242431640625, -3.119415283203125, -2.99639892578125, -2.873382568359375, -2.7503662109375, -2.627349853515625, -2.50433349609375, -2.381317138671875, -2.25830078125, -2.135284423828125, -2.01226806640625, -1.889251708984375, -1.7662353515625, -1.643218994140625, -1.52020263671875, -1.397186279296875, -1.274169921875, -1.151153564453125, -1.02813720703125, -0.905120849609375, -0.7821044921875, -0.659088134765625, -0.53607177734375, -0.413055419921875, -0.2900390625, -0.167022705078125, -0.04400634765625, 0.079010009765625, 0.2020263671875, 0.325042724609375, 0.44805908203125, 0.571075439453125, 0.694091796875, 0.817108154296875, 0.94012451171875, 1.063140869140625, 1.1861572265625, 1.309173583984375, 1.43218994140625, 1.555206298828125, 1.67822265625, 1.801239013671875, 1.92425537109375, 2.047271728515625, 2.1702880859375, 2.293304443359375, 2.41632080078125, 2.539337158203125, 2.662353515625, 2.785369873046875, 2.90838623046875, 3.031402587890625, 3.1544189453125, 3.277435302734375, 3.40045166015625, 3.523468017578125, 3.646484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 5.0, 9.0, 12.0, 14.0, 30.0, 25.0, 35.0, 30.0, 44.0, 55.0, 64.0, 65.0, 63.0, 67.0, 60.0, 56.0, 68.0, 59.0, 48.0, 38.0, 37.0, 28.0, 21.0, 21.0, 16.0, 4.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.6973876953125, -5.515869140625, -5.3343505859375, -5.15283203125, -4.9713134765625, -4.789794921875, -4.6082763671875, -4.4267578125, -4.2452392578125, -4.063720703125, -3.8822021484375, -3.70068359375, -3.5191650390625, -3.337646484375, -3.1561279296875, -2.974609375, -2.7930908203125, -2.611572265625, -2.4300537109375, -2.24853515625, -2.0670166015625, -1.885498046875, -1.7039794921875, -1.5224609375, -1.3409423828125, -1.159423828125, -0.9779052734375, -0.79638671875, -0.6148681640625, -0.433349609375, -0.2518310546875, -0.0703125, 0.1112060546875, 0.292724609375, 0.4742431640625, 0.65576171875, 0.8372802734375, 1.018798828125, 1.2003173828125, 1.3818359375, 1.5633544921875, 1.744873046875, 1.9263916015625, 2.10791015625, 2.2894287109375, 2.470947265625, 2.6524658203125, 2.833984375, 3.0155029296875, 3.197021484375, 3.3785400390625, 3.56005859375, 3.7415771484375, 3.923095703125, 4.1046142578125, 4.2861328125, 4.4676513671875, 4.649169921875, 4.8306884765625, 5.01220703125, 5.1937255859375, 5.375244140625, 5.5567626953125, 5.73828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 16.0, 29.0, 44.0, 98.0, 237.0, 777.0, 6991.0, 667853.0, 366382.0, 5068.0, 673.0, 197.0, 84.0, 50.0, 33.0, 5.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.52734375, -7.35205078125, -7.1767578125, -7.00146484375, -6.826171875, -6.65087890625, -6.4755859375, -6.30029296875, -6.125, -5.94970703125, -5.7744140625, -5.59912109375, -5.423828125, -5.24853515625, -5.0732421875, -4.89794921875, -4.72265625, -4.54736328125, -4.3720703125, -4.19677734375, -4.021484375, -3.84619140625, -3.6708984375, -3.49560546875, -3.3203125, -3.14501953125, -2.9697265625, -2.79443359375, -2.619140625, -2.44384765625, -2.2685546875, -2.09326171875, -1.91796875, -1.74267578125, -1.5673828125, -1.39208984375, -1.216796875, -1.04150390625, -0.8662109375, -0.69091796875, -0.515625, -0.34033203125, -0.1650390625, 0.01025390625, 0.185546875, 0.36083984375, 0.5361328125, 0.71142578125, 0.88671875, 1.06201171875, 1.2373046875, 1.41259765625, 1.587890625, 1.76318359375, 1.9384765625, 2.11376953125, 2.2890625, 2.46435546875, 2.6396484375, 2.81494140625, 2.990234375, 3.16552734375, 3.3408203125, 3.51611328125, 3.69140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 13.0, 15.0, 13.0, 22.0, 28.0, 55.0, 79.0, 98.0, 129.0, 136.0, 102.0, 86.0, 79.0, 45.0, 36.0, 20.0, 12.0, 8.0, 12.0, 5.0, 1.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002484321594238281, -0.00023790448904037476, -0.0002273768186569214, -0.00021684914827346802, -0.00020632147789001465, -0.00019579380750656128, -0.0001852661371231079, -0.00017473846673965454, -0.00016421079635620117, -0.0001536831259727478, -0.00014315545558929443, -0.00013262778520584106, -0.0001221001148223877, -0.00011157244443893433, -0.00010104477405548096, -9.051710367202759e-05, -7.998943328857422e-05, -6.946176290512085e-05, -5.893409252166748e-05, -4.840642213821411e-05, -3.787875175476074e-05, -2.7351081371307373e-05, -1.6823410987854004e-05, -6.295740604400635e-06, 4.231929779052734e-06, 1.4759600162506104e-05, 2.5287270545959473e-05, 3.581494092941284e-05, 4.634261131286621e-05, 5.687028169631958e-05, 6.739795207977295e-05, 7.792562246322632e-05, 8.845329284667969e-05, 9.898096323013306e-05, 0.00010950863361358643, 0.0001200363039970398, 0.00013056397438049316, 0.00014109164476394653, 0.0001516193151473999, 0.00016214698553085327, 0.00017267465591430664, 0.00018320232629776, 0.00019372999668121338, 0.00020425766706466675, 0.00021478533744812012, 0.00022531300783157349, 0.00023584067821502686, 0.0002463683485984802, 0.0002568960189819336, 0.00026742368936538696, 0.00027795135974884033, 0.0002884790301322937, 0.00029900670051574707, 0.00030953437089920044, 0.0003200620412826538, 0.0003305897116661072, 0.00034111738204956055, 0.0003516450524330139, 0.0003621727228164673, 0.00037270039319992065, 0.000383228063583374, 0.0003937557339668274, 0.00040428340435028076, 0.00041481107473373413, 0.0004253387451171875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 12.0, 18.0, 36.0, 77.0, 122.0, 241.0, 808.0, 7681.0, 764613.0, 269840.0, 4062.0, 619.0, 221.0, 88.0, 52.0, 22.0, 22.0, 9.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2734375, -5.10272216796875, -4.9320068359375, -4.76129150390625, -4.590576171875, -4.41986083984375, -4.2491455078125, -4.07843017578125, -3.90771484375, -3.73699951171875, -3.5662841796875, -3.39556884765625, -3.224853515625, -3.05413818359375, -2.8834228515625, -2.71270751953125, -2.5419921875, -2.37127685546875, -2.2005615234375, -2.02984619140625, -1.859130859375, -1.68841552734375, -1.5177001953125, -1.34698486328125, -1.17626953125, -1.00555419921875, -0.8348388671875, -0.66412353515625, -0.493408203125, -0.32269287109375, -0.1519775390625, 0.01873779296875, 0.189453125, 0.36016845703125, 0.5308837890625, 0.70159912109375, 0.872314453125, 1.04302978515625, 1.2137451171875, 1.38446044921875, 1.55517578125, 1.72589111328125, 1.8966064453125, 2.06732177734375, 2.238037109375, 2.40875244140625, 2.5794677734375, 2.75018310546875, 2.9208984375, 3.09161376953125, 3.2623291015625, 3.43304443359375, 3.603759765625, 3.77447509765625, 3.9451904296875, 4.11590576171875, 4.28662109375, 4.45733642578125, 4.6280517578125, 4.79876708984375, 4.969482421875, 5.14019775390625, 5.3109130859375, 5.48162841796875, 5.65234375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 22.0, 45.0, 121.0, 219.0, 258.0, 191.0, 77.0, 33.0, 16.0, 8.0, 8.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.814453125, -1.637542724609375, -1.46063232421875, -1.283721923828125, -1.1068115234375, -0.929901123046875, -0.75299072265625, -0.576080322265625, -0.399169921875, -0.222259521484375, -0.04534912109375, 0.131561279296875, 0.3084716796875, 0.485382080078125, 0.66229248046875, 0.839202880859375, 1.01611328125, 1.193023681640625, 1.36993408203125, 1.546844482421875, 1.7237548828125, 1.900665283203125, 2.07757568359375, 2.254486083984375, 2.431396484375, 2.608306884765625, 2.78521728515625, 2.962127685546875, 3.1390380859375, 3.315948486328125, 3.49285888671875, 3.669769287109375, 3.8466796875, 4.023590087890625, 4.20050048828125, 4.377410888671875, 4.5543212890625, 4.731231689453125, 4.90814208984375, 5.085052490234375, 5.261962890625, 5.438873291015625, 5.61578369140625, 5.792694091796875, 5.9696044921875, 6.146514892578125, 6.32342529296875, 6.500335693359375, 6.67724609375, 6.854156494140625, 7.03106689453125, 7.207977294921875, 7.3848876953125, 7.561798095703125, 7.73870849609375, 7.915618896484375, 8.092529296875, 8.269439697265625, 8.44635009765625, 8.623260498046875, 8.8001708984375, 8.977081298828125, 9.15399169921875, 9.330902099609375, 9.5078125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 10.0, 20.0, 50.0, 103.0, 186.0, 228.0, 183.0, 120.0, 50.0, 25.0, 10.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.940765380859375, -56.25018310546875, -54.55960464477539, -52.869022369384766, -51.178443908691406, -49.48786163330078, -47.797279357910156, -46.10669708251953, -44.41611862182617, -42.72553634643555, -41.03495788574219, -39.34437561035156, -37.65379333496094, -35.96321487426758, -34.27263259887695, -32.582054138183594, -30.89147186279297, -29.200891494750977, -27.510311126708984, -25.81972885131836, -24.129148483276367, -22.438568115234375, -20.74798583984375, -19.057405471801758, -17.366825103759766, -15.676244735717773, -13.985663414001465, -12.295082092285156, -10.604501724243164, -8.913921356201172, -7.223340034484863, -5.532758712768555, -3.8421783447265625, -2.151597499847412, -0.4610166549682617, 1.2295641899108887, 2.920145034790039, 4.610725402832031, 6.30130672454834, 7.991888046264648, 9.68246841430664, 11.373048782348633, 13.063630104064941, 14.75421142578125, 16.444791793823242, 18.135372161865234, 19.82595443725586, 21.51653480529785, 23.207115173339844, 24.897695541381836, 26.588275909423828, 28.278858184814453, 29.969438552856445, 31.660018920898438, 33.35060119628906, 35.04118347167969, 36.73176193237305, 38.42234420776367, 40.11292266845703, 41.803504943847656, 43.49408721923828, 45.18466567993164, 46.875247955322266, 48.565826416015625, 50.25640869140625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 4.0, 4.0, 10.0, 11.0, 14.0, 15.0, 16.0, 23.0, 14.0, 39.0, 36.0, 46.0, 54.0, 45.0, 42.0, 58.0, 47.0, 66.0, 64.0, 63.0, 46.0, 50.0, 37.0, 38.0, 32.0, 20.0, 24.0, 20.0, 13.0, 17.0, 9.0, 14.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.285371780395508, -25.575790405273438, -24.866209030151367, -24.156627655029297, -23.447046279907227, -22.737464904785156, -22.027883529663086, -21.318302154541016, -20.608720779418945, -19.899139404296875, -19.189558029174805, -18.479976654052734, -17.770395278930664, -17.060813903808594, -16.351232528686523, -15.641651153564453, -14.932069778442383, -14.222488403320312, -13.512907028198242, -12.803325653076172, -12.093744277954102, -11.384162902832031, -10.674581527709961, -9.96500015258789, -9.25541877746582, -8.54583740234375, -7.83625602722168, -7.126674652099609, -6.417093276977539, -5.707511901855469, -4.997930526733398, -4.288349151611328, -3.5787696838378906, -2.8691883087158203, -2.15960693359375, -1.4500255584716797, -0.7404441833496094, -0.030862808227539062, 0.6787185668945312, 1.3882999420166016, 2.097881317138672, 2.807462692260742, 3.5170440673828125, 4.226625442504883, 4.936206817626953, 5.645788192749023, 6.355369567871094, 7.064950942993164, 7.774532318115234, 8.484113693237305, 9.193695068359375, 9.903276443481445, 10.612857818603516, 11.322439193725586, 12.032020568847656, 12.741601943969727, 13.451183319091797, 14.160764694213867, 14.870346069335938, 15.579927444458008, 16.289508819580078, 16.99909019470215, 17.70867156982422, 18.41825294494629, 19.12783432006836]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 0.0, 4.0, 12.0, 7.0, 19.0, 14.0, 30.0, 72.0, 140.0, 309.0, 752.0, 2063.0, 9281.0, 4119988.0, 54457.0, 4836.0, 1347.0, 505.0, 210.0, 86.0, 56.0, 27.0, 23.0, 16.0, 9.0, 9.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -12.0096435546875, -11.683349609375, -11.3570556640625, -11.03076171875, -10.7044677734375, -10.378173828125, -10.0518798828125, -9.7255859375, -9.3992919921875, -9.072998046875, -8.7467041015625, -8.42041015625, -8.0941162109375, -7.767822265625, -7.4415283203125, -7.115234375, -6.7889404296875, -6.462646484375, -6.1363525390625, -5.81005859375, -5.4837646484375, -5.157470703125, -4.8311767578125, -4.5048828125, -4.1785888671875, -3.852294921875, -3.5260009765625, -3.19970703125, -2.8734130859375, -2.547119140625, -2.2208251953125, -1.89453125, -1.5682373046875, -1.241943359375, -0.9156494140625, -0.58935546875, -0.2630615234375, 0.063232421875, 0.3895263671875, 0.7158203125, 1.0421142578125, 1.368408203125, 1.6947021484375, 2.02099609375, 2.3472900390625, 2.673583984375, 2.9998779296875, 3.326171875, 3.6524658203125, 3.978759765625, 4.3050537109375, 4.63134765625, 4.9576416015625, 5.283935546875, 5.6102294921875, 5.9365234375, 6.2628173828125, 6.589111328125, 6.9154052734375, 7.24169921875, 7.5679931640625, 7.894287109375, 8.2205810546875, 8.546875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 4.0, 14.0, 13.0, 20.0, 24.0, 21.0, 33.0, 25.0, 53.0, 52.0, 48.0, 67.0, 58.0, 70.0, 71.0, 68.0, 66.0, 46.0, 48.0, 28.0, 32.0, 22.0, 22.0, 18.0, 12.0, 15.0, 7.0, 4.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.154296875, -1.1186676025390625, -1.083038330078125, -1.0474090576171875, -1.01177978515625, -0.9761505126953125, -0.940521240234375, -0.9048919677734375, -0.8692626953125, -0.8336334228515625, -0.798004150390625, -0.7623748779296875, -0.72674560546875, -0.6911163330078125, -0.655487060546875, -0.6198577880859375, -0.584228515625, -0.5485992431640625, -0.512969970703125, -0.4773406982421875, -0.44171142578125, -0.4060821533203125, -0.370452880859375, -0.3348236083984375, -0.2991943359375, -0.2635650634765625, -0.227935791015625, -0.1923065185546875, -0.15667724609375, -0.1210479736328125, -0.085418701171875, -0.0497894287109375, -0.01416015625, 0.0214691162109375, 0.057098388671875, 0.0927276611328125, 0.12835693359375, 0.1639862060546875, 0.199615478515625, 0.2352447509765625, 0.2708740234375, 0.3065032958984375, 0.342132568359375, 0.3777618408203125, 0.41339111328125, 0.4490203857421875, 0.484649658203125, 0.5202789306640625, 0.555908203125, 0.5915374755859375, 0.627166748046875, 0.6627960205078125, 0.69842529296875, 0.7340545654296875, 0.769683837890625, 0.8053131103515625, 0.8409423828125, 0.8765716552734375, 0.912200927734375, 0.9478302001953125, 0.98345947265625, 1.0190887451171875, 1.054718017578125, 1.0903472900390625, 1.1259765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 10.0, 10.0, 7.0, 11.0, 16.0, 31.0, 27.0, 45.0, 55.0, 68.0, 114.0, 169.0, 249.0, 512.0, 1347.0, 4498.0, 22864.0, 4058779.0, 90962.0, 10051.0, 2483.0, 889.0, 422.0, 198.0, 105.0, 96.0, 69.0, 43.0, 42.0, 32.0, 23.0, 12.0, 17.0, 9.0, 3.0, 4.0, 0.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.17578125, -6.93475341796875, -6.6937255859375, -6.45269775390625, -6.211669921875, -5.97064208984375, -5.7296142578125, -5.48858642578125, -5.24755859375, -5.00653076171875, -4.7655029296875, -4.52447509765625, -4.283447265625, -4.04241943359375, -3.8013916015625, -3.56036376953125, -3.3193359375, -3.07830810546875, -2.8372802734375, -2.59625244140625, -2.355224609375, -2.11419677734375, -1.8731689453125, -1.63214111328125, -1.39111328125, -1.15008544921875, -0.9090576171875, -0.66802978515625, -0.427001953125, -0.18597412109375, 0.0550537109375, 0.29608154296875, 0.537109375, 0.77813720703125, 1.0191650390625, 1.26019287109375, 1.501220703125, 1.74224853515625, 1.9832763671875, 2.22430419921875, 2.46533203125, 2.70635986328125, 2.9473876953125, 3.18841552734375, 3.429443359375, 3.67047119140625, 3.9114990234375, 4.15252685546875, 4.3935546875, 4.63458251953125, 4.8756103515625, 5.11663818359375, 5.357666015625, 5.59869384765625, 5.8397216796875, 6.08074951171875, 6.32177734375, 6.56280517578125, 6.8038330078125, 7.04486083984375, 7.285888671875, 7.52691650390625, 7.7679443359375, 8.00897216796875, 8.25]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 7.0, 6.0, 20.0, 34.0, 74.0, 3641.0, 197.0, 48.0, 19.0, 14.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6650390625, -1.6029510498046875, -1.540863037109375, -1.4787750244140625, -1.41668701171875, -1.3545989990234375, -1.292510986328125, -1.2304229736328125, -1.1683349609375, -1.1062469482421875, -1.044158935546875, -0.9820709228515625, -0.91998291015625, -0.8578948974609375, -0.795806884765625, -0.7337188720703125, -0.671630859375, -0.6095428466796875, -0.547454833984375, -0.4853668212890625, -0.42327880859375, -0.3611907958984375, -0.299102783203125, -0.2370147705078125, -0.1749267578125, -0.1128387451171875, -0.050750732421875, 0.0113372802734375, 0.07342529296875, 0.1355133056640625, 0.197601318359375, 0.2596893310546875, 0.32177734375, 0.3838653564453125, 0.445953369140625, 0.5080413818359375, 0.57012939453125, 0.6322174072265625, 0.694305419921875, 0.7563934326171875, 0.8184814453125, 0.8805694580078125, 0.942657470703125, 1.0047454833984375, 1.06683349609375, 1.1289215087890625, 1.191009521484375, 1.2530975341796875, 1.315185546875, 1.3772735595703125, 1.439361572265625, 1.5014495849609375, 1.56353759765625, 1.6256256103515625, 1.687713623046875, 1.7498016357421875, 1.8118896484375, 1.8739776611328125, 1.936065673828125, 1.9981536865234375, 2.06024169921875, 2.1223297119140625, 2.184417724609375, 2.2465057373046875, 2.30859375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 7.0, 4.0, 12.0, 13.0, 17.0, 24.0, 32.0, 38.0, 41.0, 57.0, 79.0, 68.0, 65.0, 73.0, 94.0, 68.0, 68.0, 59.0, 51.0, 35.0, 23.0, 14.0, 18.0, 9.0, 11.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.427734375, -3.3411476612091064, -3.254560947418213, -3.1679739952087402, -3.0813872814178467, -2.994800567626953, -2.9082138538360596, -2.821627140045166, -2.7350401878356934, -2.6484534740448, -2.5618667602539062, -2.4752798080444336, -2.38869309425354, -2.3021063804626465, -2.215519666671753, -2.1289329528808594, -2.0423460006713867, -1.9557592868804932, -1.86917245388031, -1.7825857400894165, -1.6959989070892334, -1.6094121932983398, -1.5228254795074463, -1.4362386465072632, -1.3496520519256592, -1.2630653381347656, -1.1764785051345825, -1.089891791343689, -1.0033049583435059, -0.9167182445526123, -0.830131471157074, -0.7435446977615356, -0.6569578647613525, -0.5703710913658142, -0.4837843179702759, -0.39719757437705994, -0.3106108009815216, -0.22402402758598328, -0.13743728399276733, -0.050850510597229004, 0.035736262798309326, 0.12232302874326706, 0.2089097946882248, 0.29549655318260193, 0.38208332657814026, 0.4686700999736786, 0.5552568435668945, 0.6418436169624329, 0.7284303903579712, 0.8150171637535095, 0.9016039371490479, 0.9881906509399414, 1.0747774839401245, 1.161364197731018, 1.2479510307312012, 1.3345377445220947, 1.4211244583129883, 1.5077111721038818, 1.594298005104065, 1.6808847188949585, 1.7674715518951416, 1.8540582656860352, 1.9406449794769287, 2.0272316932678223, 2.113818645477295]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 13.0, 13.0, 6.0, 12.0, 13.0, 15.0, 18.0, 22.0, 21.0, 33.0, 33.0, 40.0, 34.0, 38.0, 39.0, 42.0, 57.0, 49.0, 39.0, 38.0, 32.0, 42.0, 32.0, 44.0, 30.0, 28.0, 34.0, 21.0, 24.0, 20.0, 15.0, 18.0, 12.0, 18.0, 5.0, 12.0, 11.0, 3.0, 2.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.3478598594665527, -2.2728610038757324, -2.197861909866333, -2.1228628158569336, -2.0478639602661133, -1.9728649854660034, -1.8978660106658936, -1.8228670358657837, -1.7478680610656738, -1.672869086265564, -1.597870111465454, -1.5228711366653442, -1.4478721618652344, -1.3728731870651245, -1.2978742122650146, -1.2228752374649048, -1.147876262664795, -1.072877287864685, -0.9978783130645752, -0.9228793382644653, -0.8478803634643555, -0.7728813886642456, -0.6978824138641357, -0.6228834390640259, -0.547884464263916, -0.47288548946380615, -0.3978865146636963, -0.3228875398635864, -0.24788856506347656, -0.1728895902633667, -0.09789061546325684, -0.022891640663146973, 0.05210709571838379, 0.12710607051849365, 0.20210504531860352, 0.2771040201187134, 0.35210299491882324, 0.4271019697189331, 0.502100944519043, 0.5770999193191528, 0.6520988941192627, 0.7270978689193726, 0.8020968437194824, 0.8770958185195923, 0.9520947933197021, 1.027093768119812, 1.1020927429199219, 1.1770917177200317, 1.2520906925201416, 1.3270896673202515, 1.4020886421203613, 1.4770876169204712, 1.552086591720581, 1.627085566520691, 1.7020845413208008, 1.7770835161209106, 1.8520824909210205, 1.9270814657211304, 2.0020804405212402, 2.0770792961120605, 2.15207839012146, 2.2270774841308594, 2.3020763397216797, 2.3770751953125, 2.4520742893218994]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 1.0, 8.0, 6.0, 7.0, 7.0, 19.0, 24.0, 33.0, 64.0, 88.0, 157.0, 289.0, 590.0, 1078.0, 2492.0, 5797.0, 15155.0, 45330.0, 148427.0, 386642.0, 297648.0, 96095.0, 30043.0, 10500.0, 4199.0, 1877.0, 892.0, 481.0, 236.0, 138.0, 75.0, 60.0, 28.0, 25.0, 11.0, 13.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-3.119140625, -3.034423828125, -2.94970703125, -2.864990234375, -2.7802734375, -2.695556640625, -2.61083984375, -2.526123046875, -2.44140625, -2.356689453125, -2.27197265625, -2.187255859375, -2.1025390625, -2.017822265625, -1.93310546875, -1.848388671875, -1.763671875, -1.678955078125, -1.59423828125, -1.509521484375, -1.4248046875, -1.340087890625, -1.25537109375, -1.170654296875, -1.0859375, -1.001220703125, -0.91650390625, -0.831787109375, -0.7470703125, -0.662353515625, -0.57763671875, -0.492919921875, -0.408203125, -0.323486328125, -0.23876953125, -0.154052734375, -0.0693359375, 0.015380859375, 0.10009765625, 0.184814453125, 0.26953125, 0.354248046875, 0.43896484375, 0.523681640625, 0.6083984375, 0.693115234375, 0.77783203125, 0.862548828125, 0.947265625, 1.031982421875, 1.11669921875, 1.201416015625, 1.2861328125, 1.370849609375, 1.45556640625, 1.540283203125, 1.625, 1.709716796875, 1.79443359375, 1.879150390625, 1.9638671875, 2.048583984375, 2.13330078125, 2.218017578125, 2.302734375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 4.0, 8.0, 3.0, 3.0, 11.0, 16.0, 20.0, 11.0, 18.0, 18.0, 31.0, 32.0, 36.0, 36.0, 51.0, 48.0, 55.0, 54.0, 56.0, 54.0, 54.0, 50.0, 48.0, 40.0, 35.0, 41.0, 28.0, 30.0, 23.0, 13.0, 13.0, 10.0, 9.0, 11.0, 4.0, 2.0, 7.0, 1.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.203125, -1.168212890625, -1.13330078125, -1.098388671875, -1.0634765625, -1.028564453125, -0.99365234375, -0.958740234375, -0.923828125, -0.888916015625, -0.85400390625, -0.819091796875, -0.7841796875, -0.749267578125, -0.71435546875, -0.679443359375, -0.64453125, -0.609619140625, -0.57470703125, -0.539794921875, -0.5048828125, -0.469970703125, -0.43505859375, -0.400146484375, -0.365234375, -0.330322265625, -0.29541015625, -0.260498046875, -0.2255859375, -0.190673828125, -0.15576171875, -0.120849609375, -0.0859375, -0.051025390625, -0.01611328125, 0.018798828125, 0.0537109375, 0.088623046875, 0.12353515625, 0.158447265625, 0.193359375, 0.228271484375, 0.26318359375, 0.298095703125, 0.3330078125, 0.367919921875, 0.40283203125, 0.437744140625, 0.47265625, 0.507568359375, 0.54248046875, 0.577392578125, 0.6123046875, 0.647216796875, 0.68212890625, 0.717041015625, 0.751953125, 0.786865234375, 0.82177734375, 0.856689453125, 0.8916015625, 0.926513671875, 0.96142578125, 0.996337890625, 1.03125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 5.0, 11.0, 23.0, 28.0, 37.0, 55.0, 116.0, 212.0, 400.0, 859.0, 2287.0, 8027.0, 40721.0, 334975.0, 570693.0, 72603.0, 12197.0, 3192.0, 1084.0, 486.0, 231.0, 121.0, 64.0, 30.0, 29.0, 20.0, 13.0, 7.0, 3.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.10418701171875, -3.9583740234375, -3.81256103515625, -3.666748046875, -3.52093505859375, -3.3751220703125, -3.22930908203125, -3.08349609375, -2.93768310546875, -2.7918701171875, -2.64605712890625, -2.500244140625, -2.35443115234375, -2.2086181640625, -2.06280517578125, -1.9169921875, -1.77117919921875, -1.6253662109375, -1.47955322265625, -1.333740234375, -1.18792724609375, -1.0421142578125, -0.89630126953125, -0.75048828125, -0.60467529296875, -0.4588623046875, -0.31304931640625, -0.167236328125, -0.02142333984375, 0.1243896484375, 0.27020263671875, 0.416015625, 0.56182861328125, 0.7076416015625, 0.85345458984375, 0.999267578125, 1.14508056640625, 1.2908935546875, 1.43670654296875, 1.58251953125, 1.72833251953125, 1.8741455078125, 2.01995849609375, 2.165771484375, 2.31158447265625, 2.4573974609375, 2.60321044921875, 2.7490234375, 2.89483642578125, 3.0406494140625, 3.18646240234375, 3.332275390625, 3.47808837890625, 3.6239013671875, 3.76971435546875, 3.91552734375, 4.06134033203125, 4.2071533203125, 4.35296630859375, 4.498779296875, 4.64459228515625, 4.7904052734375, 4.93621826171875, 5.08203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 8.0, 18.0, 19.0, 23.0, 26.0, 36.0, 44.0, 46.0, 46.0, 51.0, 62.0, 58.0, 57.0, 58.0, 54.0, 50.0, 64.0, 46.0, 43.0, 32.0, 37.0, 28.0, 25.0, 19.0, 13.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6796875, -6.4505615234375, -6.221435546875, -5.9923095703125, -5.76318359375, -5.5340576171875, -5.304931640625, -5.0758056640625, -4.8466796875, -4.6175537109375, -4.388427734375, -4.1593017578125, -3.93017578125, -3.7010498046875, -3.471923828125, -3.2427978515625, -3.013671875, -2.7845458984375, -2.555419921875, -2.3262939453125, -2.09716796875, -1.8680419921875, -1.638916015625, -1.4097900390625, -1.1806640625, -0.9515380859375, -0.722412109375, -0.4932861328125, -0.26416015625, -0.0350341796875, 0.194091796875, 0.4232177734375, 0.65234375, 0.8814697265625, 1.110595703125, 1.3397216796875, 1.56884765625, 1.7979736328125, 2.027099609375, 2.2562255859375, 2.4853515625, 2.7144775390625, 2.943603515625, 3.1727294921875, 3.40185546875, 3.6309814453125, 3.860107421875, 4.0892333984375, 4.318359375, 4.5474853515625, 4.776611328125, 5.0057373046875, 5.23486328125, 5.4639892578125, 5.693115234375, 5.9222412109375, 6.1513671875, 6.3804931640625, 6.609619140625, 6.8387451171875, 7.06787109375, 7.2969970703125, 7.526123046875, 7.7552490234375, 7.984375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 12.0, 3.0, 8.0, 14.0, 16.0, 40.0, 72.0, 120.0, 212.0, 548.0, 1716.0, 11132.0, 472981.0, 546893.0, 11970.0, 1756.0, 535.0, 237.0, 124.0, 64.0, 42.0, 17.0, 13.0, 8.0, 5.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08203125, -4.92327880859375, -4.7645263671875, -4.60577392578125, -4.447021484375, -4.28826904296875, -4.1295166015625, -3.97076416015625, -3.81201171875, -3.65325927734375, -3.4945068359375, -3.33575439453125, -3.177001953125, -3.01824951171875, -2.8594970703125, -2.70074462890625, -2.5419921875, -2.38323974609375, -2.2244873046875, -2.06573486328125, -1.906982421875, -1.74822998046875, -1.5894775390625, -1.43072509765625, -1.27197265625, -1.11322021484375, -0.9544677734375, -0.79571533203125, -0.636962890625, -0.47821044921875, -0.3194580078125, -0.16070556640625, -0.001953125, 0.15679931640625, 0.3155517578125, 0.47430419921875, 0.633056640625, 0.79180908203125, 0.9505615234375, 1.10931396484375, 1.26806640625, 1.42681884765625, 1.5855712890625, 1.74432373046875, 1.903076171875, 2.06182861328125, 2.2205810546875, 2.37933349609375, 2.5380859375, 2.69683837890625, 2.8555908203125, 3.01434326171875, 3.173095703125, 3.33184814453125, 3.4906005859375, 3.64935302734375, 3.80810546875, 3.96685791015625, 4.1256103515625, 4.28436279296875, 4.443115234375, 4.60186767578125, 4.7606201171875, 4.91937255859375, 5.078125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 3.0, 6.0, 9.0, 27.0, 30.0, 50.0, 49.0, 103.0, 118.0, 128.0, 145.0, 107.0, 77.0, 49.0, 31.0, 21.0, 15.0, 9.0, 11.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005693435668945312, -0.0005553476512432098, -0.0005413517355918884, -0.000527355819940567, -0.0005133599042892456, -0.0004993639886379242, -0.0004853680729866028, -0.00047137215733528137, -0.00045737624168395996, -0.00044338032603263855, -0.00042938441038131714, -0.00041538849472999573, -0.0004013925790786743, -0.0003873966634273529, -0.0003734007477760315, -0.0003594048321247101, -0.00034540891647338867, -0.00033141300082206726, -0.00031741708517074585, -0.00030342116951942444, -0.00028942525386810303, -0.0002754293382167816, -0.0002614334225654602, -0.0002474375069141388, -0.00023344159126281738, -0.00021944567561149597, -0.00020544975996017456, -0.00019145384430885315, -0.00017745792865753174, -0.00016346201300621033, -0.00014946609735488892, -0.0001354701817035675, -0.0001214742660522461, -0.00010747835040092468, -9.348243474960327e-05, -7.948651909828186e-05, -6.549060344696045e-05, -5.149468779563904e-05, -3.749877214431763e-05, -2.3502856492996216e-05, -9.506940841674805e-06, 4.4889748096466064e-06, 1.8484890460968018e-05, 3.248080611228943e-05, 4.647672176361084e-05, 6.047263741493225e-05, 7.446855306625366e-05, 8.846446871757507e-05, 0.00010246038436889648, 0.0001164563000202179, 0.0001304522156715393, 0.00014444813132286072, 0.00015844404697418213, 0.00017243996262550354, 0.00018643587827682495, 0.00020043179392814636, 0.00021442770957946777, 0.00022842362523078918, 0.0002424195408821106, 0.000256415456533432, 0.0002704113721847534, 0.00028440728783607483, 0.00029840320348739624, 0.00031239911913871765, 0.00032639503479003906]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 6.0, 9.0, 15.0, 16.0, 48.0, 68.0, 115.0, 237.0, 450.0, 1078.0, 2924.0, 11790.0, 89217.0, 795351.0, 126864.0, 14523.0, 3607.0, 1206.0, 494.0, 239.0, 111.0, 74.0, 40.0, 28.0, 10.0, 8.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.970703125, -2.8765869140625, -2.782470703125, -2.6883544921875, -2.59423828125, -2.5001220703125, -2.406005859375, -2.3118896484375, -2.2177734375, -2.1236572265625, -2.029541015625, -1.9354248046875, -1.84130859375, -1.7471923828125, -1.653076171875, -1.5589599609375, -1.46484375, -1.3707275390625, -1.276611328125, -1.1824951171875, -1.08837890625, -0.9942626953125, -0.900146484375, -0.8060302734375, -0.7119140625, -0.6177978515625, -0.523681640625, -0.4295654296875, -0.33544921875, -0.2413330078125, -0.147216796875, -0.0531005859375, 0.041015625, 0.1351318359375, 0.229248046875, 0.3233642578125, 0.41748046875, 0.5115966796875, 0.605712890625, 0.6998291015625, 0.7939453125, 0.8880615234375, 0.982177734375, 1.0762939453125, 1.17041015625, 1.2645263671875, 1.358642578125, 1.4527587890625, 1.546875, 1.6409912109375, 1.735107421875, 1.8292236328125, 1.92333984375, 2.0174560546875, 2.111572265625, 2.2056884765625, 2.2998046875, 2.3939208984375, 2.488037109375, 2.5821533203125, 2.67626953125, 2.7703857421875, 2.864501953125, 2.9586181640625, 3.052734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 7.0, 1.0, 6.0, 8.0, 15.0, 13.0, 20.0, 29.0, 43.0, 50.0, 75.0, 101.0, 120.0, 134.0, 109.0, 70.0, 63.0, 32.0, 25.0, 21.0, 15.0, 11.0, 9.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.40234375, -3.30487060546875, -3.2073974609375, -3.10992431640625, -3.012451171875, -2.91497802734375, -2.8175048828125, -2.72003173828125, -2.62255859375, -2.52508544921875, -2.4276123046875, -2.33013916015625, -2.232666015625, -2.13519287109375, -2.0377197265625, -1.94024658203125, -1.8427734375, -1.74530029296875, -1.6478271484375, -1.55035400390625, -1.452880859375, -1.35540771484375, -1.2579345703125, -1.16046142578125, -1.06298828125, -0.96551513671875, -0.8680419921875, -0.77056884765625, -0.673095703125, -0.57562255859375, -0.4781494140625, -0.38067626953125, -0.283203125, -0.18572998046875, -0.0882568359375, 0.00921630859375, 0.106689453125, 0.20416259765625, 0.3016357421875, 0.39910888671875, 0.49658203125, 0.59405517578125, 0.6915283203125, 0.78900146484375, 0.886474609375, 0.98394775390625, 1.0814208984375, 1.17889404296875, 1.2763671875, 1.37384033203125, 1.4713134765625, 1.56878662109375, 1.666259765625, 1.76373291015625, 1.8612060546875, 1.95867919921875, 2.05615234375, 2.15362548828125, 2.2510986328125, 2.34857177734375, 2.446044921875, 2.54351806640625, 2.6409912109375, 2.73846435546875, 2.8359375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 12.0, 14.0, 17.0, 29.0, 57.0, 94.0, 118.0, 161.0, 156.0, 96.0, 95.0, 64.0, 33.0, 20.0, 8.0, 14.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.67017364501953, -44.55193328857422, -43.433692932128906, -42.31545639038086, -41.19721603393555, -40.078975677490234, -38.96073913574219, -37.842498779296875, -36.72425842285156, -35.60601806640625, -34.48777770996094, -33.36954116821289, -32.25130081176758, -31.133060455322266, -30.014822006225586, -28.896583557128906, -27.778343200683594, -26.66010284423828, -25.5418643951416, -24.423625946044922, -23.30538558959961, -22.187145233154297, -21.068906784057617, -19.950668334960938, -18.832427978515625, -17.714187622070312, -16.595949172973633, -15.477709770202637, -14.35947036743164, -13.241230964660645, -12.122991561889648, -11.004752159118652, -9.886512756347656, -8.76827335357666, -7.650033950805664, -6.531794548034668, -5.413555145263672, -4.295315742492676, -3.1770763397216797, -2.0588369369506836, -0.9405975341796875, 0.1776418685913086, 1.2958812713623047, 2.414120674133301, 3.532360076904297, 4.650599479675293, 5.768838882446289, 6.887078285217285, 8.005317687988281, 9.123557090759277, 10.241796493530273, 11.36003589630127, 12.478275299072266, 13.596514701843262, 14.714754104614258, 15.832993507385254, 16.95123291015625, 18.069473266601562, 19.187711715698242, 20.305950164794922, 21.424190521240234, 22.542430877685547, 23.660669326782227, 24.778907775878906, 25.89714813232422]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 1.0, 7.0, 10.0, 12.0, 9.0, 18.0, 13.0, 18.0, 20.0, 24.0, 22.0, 24.0, 22.0, 36.0, 39.0, 36.0, 47.0, 52.0, 41.0, 42.0, 48.0, 43.0, 47.0, 41.0, 36.0, 40.0, 37.0, 22.0, 28.0, 25.0, 18.0, 18.0, 19.0, 9.0, 13.0, 13.0, 7.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.017623901367188, -22.295289993286133, -21.572956085205078, -20.850622177124023, -20.12828826904297, -19.405956268310547, -18.683622360229492, -17.961288452148438, -17.238954544067383, -16.516620635986328, -15.794286727905273, -15.071953773498535, -14.34961986541748, -13.627285957336426, -12.904953002929688, -12.182619094848633, -11.460285186767578, -10.737951278686523, -10.015617370605469, -9.29328441619873, -8.570950508117676, -7.848616600036621, -7.126283168792725, -6.403949737548828, -5.681615829467773, -4.959281921386719, -4.236948490142822, -3.5146148204803467, -2.792281150817871, -2.0699474811553955, -1.34761381149292, -0.6252803802490234, 0.09705352783203125, 0.8193871974945068, 1.5417208671569824, 2.264054536819458, 2.9863882064819336, 3.708721876144409, 4.431055545806885, 5.153388977050781, 5.875722885131836, 6.598056793212891, 7.320390224456787, 8.042723655700684, 8.765057563781738, 9.487391471862793, 10.209724426269531, 10.932058334350586, 11.65439224243164, 12.376726150512695, 13.09906005859375, 13.821393013000488, 14.543726921081543, 15.266060829162598, 15.988393783569336, 16.71072769165039, 17.433061599731445, 18.1553955078125, 18.877729415893555, 19.60006332397461, 20.32239532470703, 21.044729232788086, 21.76706314086914, 22.489397048950195, 23.21173095703125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 11.0, 14.0, 22.0, 37.0, 63.0, 112.0, 216.0, 455.0, 1021.0, 3057.0, 12103.0, 148594.0, 3998169.0, 23362.0, 4563.0, 1403.0, 548.0, 269.0, 109.0, 62.0, 38.0, 25.0, 9.0, 8.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66796875, -7.46710205078125, -7.2662353515625, -7.06536865234375, -6.864501953125, -6.66363525390625, -6.4627685546875, -6.26190185546875, -6.06103515625, -5.86016845703125, -5.6593017578125, -5.45843505859375, -5.257568359375, -5.05670166015625, -4.8558349609375, -4.65496826171875, -4.4541015625, -4.25323486328125, -4.0523681640625, -3.85150146484375, -3.650634765625, -3.44976806640625, -3.2489013671875, -3.04803466796875, -2.84716796875, -2.64630126953125, -2.4454345703125, -2.24456787109375, -2.043701171875, -1.84283447265625, -1.6419677734375, -1.44110107421875, -1.240234375, -1.03936767578125, -0.8385009765625, -0.63763427734375, -0.436767578125, -0.23590087890625, -0.0350341796875, 0.16583251953125, 0.36669921875, 0.56756591796875, 0.7684326171875, 0.96929931640625, 1.170166015625, 1.37103271484375, 1.5718994140625, 1.77276611328125, 1.9736328125, 2.17449951171875, 2.3753662109375, 2.57623291015625, 2.777099609375, 2.97796630859375, 3.1788330078125, 3.37969970703125, 3.58056640625, 3.78143310546875, 3.9822998046875, 4.18316650390625, 4.384033203125, 4.58489990234375, 4.7857666015625, 4.98663330078125, 5.1875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 9.0, 10.0, 8.0, 5.0, 16.0, 27.0, 31.0, 46.0, 64.0, 79.0, 76.0, 83.0, 92.0, 84.0, 64.0, 89.0, 71.0, 37.0, 36.0, 14.0, 15.0, 9.0, 8.0, 7.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2109375, -2.153106689453125, -2.09527587890625, -2.037445068359375, -1.9796142578125, -1.921783447265625, -1.86395263671875, -1.806121826171875, -1.748291015625, -1.690460205078125, -1.63262939453125, -1.574798583984375, -1.5169677734375, -1.459136962890625, -1.40130615234375, -1.343475341796875, -1.28564453125, -1.227813720703125, -1.16998291015625, -1.112152099609375, -1.0543212890625, -0.996490478515625, -0.93865966796875, -0.880828857421875, -0.822998046875, -0.765167236328125, -0.70733642578125, -0.649505615234375, -0.5916748046875, -0.533843994140625, -0.47601318359375, -0.418182373046875, -0.3603515625, -0.302520751953125, -0.24468994140625, -0.186859130859375, -0.1290283203125, -0.071197509765625, -0.01336669921875, 0.044464111328125, 0.102294921875, 0.160125732421875, 0.21795654296875, 0.275787353515625, 0.3336181640625, 0.391448974609375, 0.44927978515625, 0.507110595703125, 0.56494140625, 0.622772216796875, 0.68060302734375, 0.738433837890625, 0.7962646484375, 0.854095458984375, 0.91192626953125, 0.969757080078125, 1.027587890625, 1.085418701171875, 1.14324951171875, 1.201080322265625, 1.2589111328125, 1.316741943359375, 1.37457275390625, 1.432403564453125, 1.490234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 7.0, 9.0, 6.0, 3.0, 19.0, 18.0, 26.0, 29.0, 49.0, 53.0, 81.0, 189.0, 358.0, 922.0, 2764.0, 17681.0, 4051306.0, 111600.0, 6395.0, 1532.0, 561.0, 245.0, 149.0, 81.0, 61.0, 41.0, 26.0, 23.0, 12.0, 11.0, 9.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5234375, -7.1611328125, -6.798828125, -6.4365234375, -6.07421875, -5.7119140625, -5.349609375, -4.9873046875, -4.625, -4.2626953125, -3.900390625, -3.5380859375, -3.17578125, -2.8134765625, -2.451171875, -2.0888671875, -1.7265625, -1.3642578125, -1.001953125, -0.6396484375, -0.27734375, 0.0849609375, 0.447265625, 0.8095703125, 1.171875, 1.5341796875, 1.896484375, 2.2587890625, 2.62109375, 2.9833984375, 3.345703125, 3.7080078125, 4.0703125, 4.4326171875, 4.794921875, 5.1572265625, 5.51953125, 5.8818359375, 6.244140625, 6.6064453125, 6.96875, 7.3310546875, 7.693359375, 8.0556640625, 8.41796875, 8.7802734375, 9.142578125, 9.5048828125, 9.8671875, 10.2294921875, 10.591796875, 10.9541015625, 11.31640625, 11.6787109375, 12.041015625, 12.4033203125, 12.765625, 13.1279296875, 13.490234375, 13.8525390625, 14.21484375, 14.5771484375, 14.939453125, 15.3017578125, 15.6640625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 10.0, 24.0, 50.0, 210.0, 3458.0, 206.0, 60.0, 27.0, 13.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53515625, -2.381103515625, -2.22705078125, -2.072998046875, -1.9189453125, -1.764892578125, -1.61083984375, -1.456787109375, -1.302734375, -1.148681640625, -0.99462890625, -0.840576171875, -0.6865234375, -0.532470703125, -0.37841796875, -0.224365234375, -0.0703125, 0.083740234375, 0.23779296875, 0.391845703125, 0.5458984375, 0.699951171875, 0.85400390625, 1.008056640625, 1.162109375, 1.316162109375, 1.47021484375, 1.624267578125, 1.7783203125, 1.932373046875, 2.08642578125, 2.240478515625, 2.39453125, 2.548583984375, 2.70263671875, 2.856689453125, 3.0107421875, 3.164794921875, 3.31884765625, 3.472900390625, 3.626953125, 3.781005859375, 3.93505859375, 4.089111328125, 4.2431640625, 4.397216796875, 4.55126953125, 4.705322265625, 4.859375, 5.013427734375, 5.16748046875, 5.321533203125, 5.4755859375, 5.629638671875, 5.78369140625, 5.937744140625, 6.091796875, 6.245849609375, 6.39990234375, 6.553955078125, 6.7080078125, 6.862060546875, 7.01611328125, 7.170166015625, 7.32421875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 36.0, 88.0, 245.0, 348.0, 201.0, 57.0, 18.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.21238899230957, -16.321622848510742, -15.430856704711914, -14.540090560913086, -13.649324417114258, -12.75855827331543, -11.867791175842285, -10.977025032043457, -10.086258888244629, -9.1954927444458, -8.304726600646973, -7.413959980010986, -6.523193836212158, -5.63242769241333, -4.741661071777344, -3.8508949279785156, -2.9601287841796875, -2.0693626403808594, -1.1785962581634521, -0.2878298759460449, 0.6029362678527832, 1.4937024116516113, 2.3844690322875977, 3.275235176086426, 4.166001319885254, 5.056767463684082, 5.94753360748291, 6.8383002281188965, 7.729066371917725, 8.619832992553711, 9.510599136352539, 10.401365280151367, 11.292133331298828, 12.182899475097656, 13.073665618896484, 13.964431762695312, 14.85519790649414, 15.745964050292969, 16.636730194091797, 17.527496337890625, 18.418262481689453, 19.30902862548828, 20.19979476928711, 21.090560913085938, 21.981327056884766, 22.872093200683594, 23.762859344482422, 24.65362548828125, 25.54439353942871, 26.43515968322754, 27.325925827026367, 28.216691970825195, 29.107458114624023, 29.99822425842285, 30.888992309570312, 31.77975845336914, 32.67052459716797, 33.5612907409668, 34.452056884765625, 35.34282302856445, 36.23358917236328, 37.12435531616211, 38.01512145996094, 38.905887603759766, 39.796653747558594]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 7.0, 10.0, 11.0, 21.0, 29.0, 39.0, 72.0, 66.0, 82.0, 106.0, 92.0, 89.0, 96.0, 70.0, 67.0, 49.0, 33.0, 25.0, 19.0, 9.0, 4.0, 8.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.999860763549805, -12.589277267456055, -12.178694725036621, -11.768112182617188, -11.357528686523438, -10.946945190429688, -10.536362648010254, -10.12578010559082, -9.71519660949707, -9.30461311340332, -8.894030570983887, -8.483448028564453, -8.072864532470703, -7.662281513214111, -7.2516984939575195, -6.841115474700928, -6.430532455444336, -6.019949436187744, -5.609366416931152, -5.1987833976745605, -4.788200378417969, -4.377617359161377, -3.967034339904785, -3.5564513206481934, -3.1458683013916016, -2.7352852821350098, -2.324702262878418, -1.9141192436218262, -1.5035362243652344, -1.0929532051086426, -0.6823701858520508, -0.271787166595459, 0.1387948989868164, 0.5493779182434082, 0.9599609375, 1.3705439567565918, 1.7811269760131836, 2.1917099952697754, 2.602293014526367, 3.012876033782959, 3.423459053039551, 3.8340420722961426, 4.244625091552734, 4.655208110809326, 5.065791130065918, 5.47637414932251, 5.886957168579102, 6.297540187835693, 6.708123207092285, 7.118706226348877, 7.529289245605469, 7.9398722648620605, 8.350455284118652, 8.761037826538086, 9.171621322631836, 9.582204818725586, 9.99278736114502, 10.403369903564453, 10.813953399658203, 11.224536895751953, 11.635119438171387, 12.04570198059082, 12.45628547668457, 12.86686897277832, 13.277451515197754]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 4.0, 7.0, 12.0, 15.0, 24.0, 37.0, 57.0, 75.0, 113.0, 164.0, 270.0, 455.0, 808.0, 1514.0, 3023.0, 6976.0, 19208.0, 65711.0, 255612.0, 461734.0, 165517.0, 43141.0, 13476.0, 5229.0, 2456.0, 1204.0, 675.0, 389.0, 209.0, 153.0, 102.0, 62.0, 36.0, 23.0, 13.0, 15.0, 8.0, 11.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.646484375, -3.533721923828125, -3.42095947265625, -3.308197021484375, -3.1954345703125, -3.082672119140625, -2.96990966796875, -2.857147216796875, -2.744384765625, -2.631622314453125, -2.51885986328125, -2.406097412109375, -2.2933349609375, -2.180572509765625, -2.06781005859375, -1.955047607421875, -1.84228515625, -1.729522705078125, -1.61676025390625, -1.503997802734375, -1.3912353515625, -1.278472900390625, -1.16571044921875, -1.052947998046875, -0.940185546875, -0.827423095703125, -0.71466064453125, -0.601898193359375, -0.4891357421875, -0.376373291015625, -0.26361083984375, -0.150848388671875, -0.0380859375, 0.074676513671875, 0.18743896484375, 0.300201416015625, 0.4129638671875, 0.525726318359375, 0.63848876953125, 0.751251220703125, 0.864013671875, 0.976776123046875, 1.08953857421875, 1.202301025390625, 1.3150634765625, 1.427825927734375, 1.54058837890625, 1.653350830078125, 1.76611328125, 1.878875732421875, 1.99163818359375, 2.104400634765625, 2.2171630859375, 2.329925537109375, 2.44268798828125, 2.555450439453125, 2.668212890625, 2.780975341796875, 2.89373779296875, 3.006500244140625, 3.1192626953125, 3.232025146484375, 3.34478759765625, 3.457550048828125, 3.5703125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 0.0, 3.0, 6.0, 7.0, 7.0, 15.0, 15.0, 15.0, 26.0, 34.0, 30.0, 66.0, 69.0, 58.0, 77.0, 79.0, 82.0, 60.0, 61.0, 65.0, 60.0, 44.0, 30.0, 33.0, 18.0, 7.0, 10.0, 5.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.111328125, -2.052337646484375, -1.99334716796875, -1.934356689453125, -1.8753662109375, -1.816375732421875, -1.75738525390625, -1.698394775390625, -1.639404296875, -1.580413818359375, -1.52142333984375, -1.462432861328125, -1.4034423828125, -1.344451904296875, -1.28546142578125, -1.226470947265625, -1.16748046875, -1.108489990234375, -1.04949951171875, -0.990509033203125, -0.9315185546875, -0.872528076171875, -0.81353759765625, -0.754547119140625, -0.695556640625, -0.636566162109375, -0.57757568359375, -0.518585205078125, -0.4595947265625, -0.400604248046875, -0.34161376953125, -0.282623291015625, -0.2236328125, -0.164642333984375, -0.10565185546875, -0.046661376953125, 0.0123291015625, 0.071319580078125, 0.13031005859375, 0.189300537109375, 0.248291015625, 0.307281494140625, 0.36627197265625, 0.425262451171875, 0.4842529296875, 0.543243408203125, 0.60223388671875, 0.661224365234375, 0.72021484375, 0.779205322265625, 0.83819580078125, 0.897186279296875, 0.9561767578125, 1.015167236328125, 1.07415771484375, 1.133148193359375, 1.192138671875, 1.251129150390625, 1.31011962890625, 1.369110107421875, 1.4281005859375, 1.487091064453125, 1.54608154296875, 1.605072021484375, 1.6640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 10.0, 10.0, 19.0, 48.0, 93.0, 221.0, 778.0, 3417.0, 48226.0, 920596.0, 69864.0, 4043.0, 783.0, 241.0, 97.0, 40.0, 35.0, 10.0, 8.0, 5.0, 3.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.92578125, -7.57427978515625, -7.2227783203125, -6.87127685546875, -6.519775390625, -6.16827392578125, -5.8167724609375, -5.46527099609375, -5.11376953125, -4.76226806640625, -4.4107666015625, -4.05926513671875, -3.707763671875, -3.35626220703125, -3.0047607421875, -2.65325927734375, -2.3017578125, -1.95025634765625, -1.5987548828125, -1.24725341796875, -0.895751953125, -0.54425048828125, -0.1927490234375, 0.15875244140625, 0.51025390625, 0.86175537109375, 1.2132568359375, 1.56475830078125, 1.916259765625, 2.26776123046875, 2.6192626953125, 2.97076416015625, 3.322265625, 3.67376708984375, 4.0252685546875, 4.37677001953125, 4.728271484375, 5.07977294921875, 5.4312744140625, 5.78277587890625, 6.13427734375, 6.48577880859375, 6.8372802734375, 7.18878173828125, 7.540283203125, 7.89178466796875, 8.2432861328125, 8.59478759765625, 8.9462890625, 9.29779052734375, 9.6492919921875, 10.00079345703125, 10.352294921875, 10.70379638671875, 11.0552978515625, 11.40679931640625, 11.75830078125, 12.10980224609375, 12.4613037109375, 12.81280517578125, 13.164306640625, 13.51580810546875, 13.8673095703125, 14.21881103515625, 14.5703125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 11.0, 11.0, 11.0, 22.0, 30.0, 28.0, 36.0, 38.0, 55.0, 66.0, 72.0, 70.0, 83.0, 81.0, 64.0, 57.0, 52.0, 52.0, 48.0, 26.0, 20.0, 15.0, 11.0, 17.0, 7.0, 6.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.734375, -5.4593505859375, -5.184326171875, -4.9093017578125, -4.63427734375, -4.3592529296875, -4.084228515625, -3.8092041015625, -3.5341796875, -3.2591552734375, -2.984130859375, -2.7091064453125, -2.43408203125, -2.1590576171875, -1.884033203125, -1.6090087890625, -1.333984375, -1.0589599609375, -0.783935546875, -0.5089111328125, -0.23388671875, 0.0411376953125, 0.316162109375, 0.5911865234375, 0.8662109375, 1.1412353515625, 1.416259765625, 1.6912841796875, 1.96630859375, 2.2413330078125, 2.516357421875, 2.7913818359375, 3.06640625, 3.3414306640625, 3.616455078125, 3.8914794921875, 4.16650390625, 4.4415283203125, 4.716552734375, 4.9915771484375, 5.2666015625, 5.5416259765625, 5.816650390625, 6.0916748046875, 6.36669921875, 6.6417236328125, 6.916748046875, 7.1917724609375, 7.466796875, 7.7418212890625, 8.016845703125, 8.2918701171875, 8.56689453125, 8.8419189453125, 9.116943359375, 9.3919677734375, 9.6669921875, 9.9420166015625, 10.217041015625, 10.4920654296875, 10.76708984375, 11.0421142578125, 11.317138671875, 11.5921630859375, 11.8671875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 4.0, 14.0, 7.0, 8.0, 18.0, 18.0, 16.0, 30.0, 45.0, 94.0, 132.0, 181.0, 335.0, 583.0, 1237.0, 3189.0, 11082.0, 65106.0, 568168.0, 347003.0, 38894.0, 7671.0, 2411.0, 1010.0, 505.0, 268.0, 178.0, 104.0, 80.0, 41.0, 31.0, 32.0, 11.0, 6.0, 10.0, 2.0, 5.0, 5.0, 2.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.658203125, -1.607757568359375, -1.55731201171875, -1.506866455078125, -1.4564208984375, -1.405975341796875, -1.35552978515625, -1.305084228515625, -1.254638671875, -1.204193115234375, -1.15374755859375, -1.103302001953125, -1.0528564453125, -1.002410888671875, -0.95196533203125, -0.901519775390625, -0.85107421875, -0.800628662109375, -0.75018310546875, -0.699737548828125, -0.6492919921875, -0.598846435546875, -0.54840087890625, -0.497955322265625, -0.447509765625, -0.397064208984375, -0.34661865234375, -0.296173095703125, -0.2457275390625, -0.195281982421875, -0.14483642578125, -0.094390869140625, -0.0439453125, 0.006500244140625, 0.05694580078125, 0.107391357421875, 0.1578369140625, 0.208282470703125, 0.25872802734375, 0.309173583984375, 0.359619140625, 0.410064697265625, 0.46051025390625, 0.510955810546875, 0.5614013671875, 0.611846923828125, 0.66229248046875, 0.712738037109375, 0.76318359375, 0.813629150390625, 0.86407470703125, 0.914520263671875, 0.9649658203125, 1.015411376953125, 1.06585693359375, 1.116302490234375, 1.166748046875, 1.217193603515625, 1.26763916015625, 1.318084716796875, 1.3685302734375, 1.418975830078125, 1.46942138671875, 1.519866943359375, 1.5703125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 11.0, 14.0, 19.0, 22.0, 29.0, 35.0, 46.0, 45.0, 63.0, 53.0, 77.0, 79.0, 70.0, 75.0, 44.0, 59.0, 49.0, 35.0, 29.0, 20.0, 19.0, 13.0, 20.0, 11.0, 13.0, 10.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00022077560424804688, -0.0002142973244190216, -0.00020781904458999634, -0.00020134076476097107, -0.0001948624849319458, -0.00018838420510292053, -0.00018190592527389526, -0.00017542764544487, -0.00016894936561584473, -0.00016247108578681946, -0.0001559928059577942, -0.00014951452612876892, -0.00014303624629974365, -0.00013655796647071838, -0.00013007968664169312, -0.00012360140681266785, -0.00011712312698364258, -0.00011064484715461731, -0.00010416656732559204, -9.768828749656677e-05, -9.12100076675415e-05, -8.473172783851624e-05, -7.825344800949097e-05, -7.17751681804657e-05, -6.529688835144043e-05, -5.881860852241516e-05, -5.234032869338989e-05, -4.5862048864364624e-05, -3.9383769035339355e-05, -3.290548920631409e-05, -2.642720937728882e-05, -1.994892954826355e-05, -1.3470649719238281e-05, -6.992369890213013e-06, -5.140900611877441e-07, 5.964189767837524e-06, 1.2442469596862793e-05, 1.892074942588806e-05, 2.539902925491333e-05, 3.18773090839386e-05, 3.835558891296387e-05, 4.4833868741989136e-05, 5.1312148571014404e-05, 5.779042840003967e-05, 6.426870822906494e-05, 7.074698805809021e-05, 7.722526788711548e-05, 8.370354771614075e-05, 9.018182754516602e-05, 9.666010737419128e-05, 0.00010313838720321655, 0.00010961666703224182, 0.00011609494686126709, 0.00012257322669029236, 0.00012905150651931763, 0.0001355297863483429, 0.00014200806617736816, 0.00014848634600639343, 0.0001549646258354187, 0.00016144290566444397, 0.00016792118549346924, 0.0001743994653224945, 0.00018087774515151978, 0.00018735602498054504, 0.0001938343048095703]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 12.0, 12.0, 21.0, 45.0, 99.0, 192.0, 522.0, 1704.0, 11326.0, 523906.0, 497016.0, 11021.0, 1735.0, 555.0, 227.0, 77.0, 36.0, 26.0, 9.0, 7.0, 3.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.20562744140625, -3.0987548828125, -2.99188232421875, -2.885009765625, -2.77813720703125, -2.6712646484375, -2.56439208984375, -2.45751953125, -2.35064697265625, -2.2437744140625, -2.13690185546875, -2.030029296875, -1.92315673828125, -1.8162841796875, -1.70941162109375, -1.6025390625, -1.49566650390625, -1.3887939453125, -1.28192138671875, -1.175048828125, -1.06817626953125, -0.9613037109375, -0.85443115234375, -0.74755859375, -0.64068603515625, -0.5338134765625, -0.42694091796875, -0.320068359375, -0.21319580078125, -0.1063232421875, 0.00054931640625, 0.107421875, 0.21429443359375, 0.3211669921875, 0.42803955078125, 0.534912109375, 0.64178466796875, 0.7486572265625, 0.85552978515625, 0.96240234375, 1.06927490234375, 1.1761474609375, 1.28302001953125, 1.389892578125, 1.49676513671875, 1.6036376953125, 1.71051025390625, 1.8173828125, 1.92425537109375, 2.0311279296875, 2.13800048828125, 2.244873046875, 2.35174560546875, 2.4586181640625, 2.56549072265625, 2.67236328125, 2.77923583984375, 2.8861083984375, 2.99298095703125, 3.099853515625, 3.20672607421875, 3.3135986328125, 3.42047119140625, 3.52734375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 3.0, 10.0, 9.0, 20.0, 32.0, 45.0, 61.0, 91.0, 98.0, 145.0, 105.0, 107.0, 86.0, 74.0, 34.0, 32.0, 19.0, 12.0, 11.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2646484375, -1.1865386962890625, -1.108428955078125, -1.0303192138671875, -0.95220947265625, -0.8740997314453125, -0.795989990234375, -0.7178802490234375, -0.6397705078125, -0.5616607666015625, -0.483551025390625, -0.4054412841796875, -0.32733154296875, -0.2492218017578125, -0.171112060546875, -0.0930023193359375, -0.014892578125, 0.0632171630859375, 0.141326904296875, 0.2194366455078125, 0.29754638671875, 0.3756561279296875, 0.453765869140625, 0.5318756103515625, 0.6099853515625, 0.6880950927734375, 0.766204833984375, 0.8443145751953125, 0.92242431640625, 1.0005340576171875, 1.078643798828125, 1.1567535400390625, 1.23486328125, 1.3129730224609375, 1.391082763671875, 1.4691925048828125, 1.54730224609375, 1.6254119873046875, 1.703521728515625, 1.7816314697265625, 1.8597412109375, 1.9378509521484375, 2.015960693359375, 2.0940704345703125, 2.17218017578125, 2.2502899169921875, 2.328399658203125, 2.4065093994140625, 2.484619140625, 2.5627288818359375, 2.640838623046875, 2.7189483642578125, 2.79705810546875, 2.8751678466796875, 2.953277587890625, 3.0313873291015625, 3.1094970703125, 3.1876068115234375, 3.265716552734375, 3.3438262939453125, 3.42193603515625, 3.5000457763671875, 3.578155517578125, 3.6562652587890625, 3.734375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 5.0, 36.0, 75.0, 122.0, 226.0, 228.0, 134.0, 91.0, 46.0, 18.0, 7.0, 6.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.32183074951172, -56.514591217041016, -54.70735168457031, -52.900108337402344, -51.09286880493164, -49.28562927246094, -47.478389739990234, -45.67115020751953, -43.86390686035156, -42.05666732788086, -40.249427795410156, -38.44218444824219, -36.634944915771484, -34.82770538330078, -33.02046585083008, -31.213226318359375, -29.405986785888672, -27.59874725341797, -25.791505813598633, -23.98426628112793, -22.177024841308594, -20.36978530883789, -18.562545776367188, -16.755306243896484, -14.948064804077148, -13.140824317932129, -11.33358383178711, -9.526344299316406, -7.719103813171387, -5.911863327026367, -4.104623794555664, -2.2973833084106445, -0.490142822265625, 1.3170974254608154, 3.124337673187256, 4.931577682495117, 6.738818168640137, 8.546058654785156, 10.35329818725586, 12.160538673400879, 13.967779159545898, 15.775019645690918, 17.582260131835938, 19.38949966430664, 21.196739196777344, 23.00398063659668, 24.811220169067383, 26.61846160888672, 28.425701141357422, 30.232940673828125, 32.04018020629883, 33.84741973876953, 35.6546630859375, 37.4619026184082, 39.269142150878906, 41.07638168334961, 42.88362121582031, 44.690860748291016, 46.49810028076172, 48.30534362792969, 50.11258316040039, 51.919822692871094, 53.7270622253418, 55.5343017578125, 57.34154510498047]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 3.0, 6.0, 9.0, 12.0, 13.0, 20.0, 16.0, 25.0, 16.0, 27.0, 37.0, 40.0, 40.0, 34.0, 62.0, 65.0, 62.0, 58.0, 69.0, 50.0, 52.0, 43.0, 46.0, 32.0, 37.0, 19.0, 25.0, 17.0, 22.0, 11.0, 7.0, 6.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-34.696685791015625, -33.67158889770508, -32.64649200439453, -31.62139129638672, -30.596294403076172, -29.571197509765625, -28.546098709106445, -27.520999908447266, -26.49590301513672, -25.470806121826172, -24.445707321166992, -23.420608520507812, -22.395511627197266, -21.37041473388672, -20.34531593322754, -19.32021713256836, -18.295120239257812, -17.270023345947266, -16.244924545288086, -15.219826698303223, -14.19472885131836, -13.169631004333496, -12.144533157348633, -11.11943531036377, -10.094337463378906, -9.069239616394043, -8.04414176940918, -7.019043922424316, -5.993946075439453, -4.96884822845459, -3.9437503814697266, -2.9186525344848633, -1.8935585021972656, -0.8684606552124023, 0.15663719177246094, 1.1817350387573242, 2.2068328857421875, 3.231930732727051, 4.257028579711914, 5.282126426696777, 6.307224273681641, 7.332322120666504, 8.357419967651367, 9.38251781463623, 10.407615661621094, 11.432713508605957, 12.45781135559082, 13.482909202575684, 14.508007049560547, 15.53310489654541, 16.558202743530273, 17.583301544189453, 18.6083984375, 19.633495330810547, 20.658594131469727, 21.683692932128906, 22.708789825439453, 23.73388671875, 24.75898551940918, 25.78408432006836, 26.809181213378906, 27.834278106689453, 28.859376907348633, 29.884475708007812, 30.90957260131836]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 11.0, 15.0, 20.0, 10.0, 23.0, 49.0, 59.0, 86.0, 166.0, 271.0, 590.0, 1344.0, 3577.0, 12022.0, 62283.0, 2812317.0, 1236787.0, 49023.0, 10328.0, 3156.0, 1163.0, 495.0, 214.0, 134.0, 57.0, 35.0, 13.0, 12.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-6.15234375, -6.021240234375, -5.89013671875, -5.759033203125, -5.6279296875, -5.496826171875, -5.36572265625, -5.234619140625, -5.103515625, -4.972412109375, -4.84130859375, -4.710205078125, -4.5791015625, -4.447998046875, -4.31689453125, -4.185791015625, -4.0546875, -3.923583984375, -3.79248046875, -3.661376953125, -3.5302734375, -3.399169921875, -3.26806640625, -3.136962890625, -3.005859375, -2.874755859375, -2.74365234375, -2.612548828125, -2.4814453125, -2.350341796875, -2.21923828125, -2.088134765625, -1.95703125, -1.825927734375, -1.69482421875, -1.563720703125, -1.4326171875, -1.301513671875, -1.17041015625, -1.039306640625, -0.908203125, -0.777099609375, -0.64599609375, -0.514892578125, -0.3837890625, -0.252685546875, -0.12158203125, 0.009521484375, 0.140625, 0.271728515625, 0.40283203125, 0.533935546875, 0.6650390625, 0.796142578125, 0.92724609375, 1.058349609375, 1.189453125, 1.320556640625, 1.45166015625, 1.582763671875, 1.7138671875, 1.844970703125, 1.97607421875, 2.107177734375, 2.23828125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 10.0, 3.0, 8.0, 6.0, 14.0, 19.0, 17.0, 33.0, 30.0, 30.0, 44.0, 49.0, 57.0, 75.0, 58.0, 64.0, 56.0, 65.0, 60.0, 47.0, 48.0, 37.0, 45.0, 27.0, 25.0, 27.0, 10.0, 16.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4951171875, -1.45074462890625, -1.4063720703125, -1.36199951171875, -1.317626953125, -1.27325439453125, -1.2288818359375, -1.18450927734375, -1.14013671875, -1.09576416015625, -1.0513916015625, -1.00701904296875, -0.962646484375, -0.91827392578125, -0.8739013671875, -0.82952880859375, -0.78515625, -0.74078369140625, -0.6964111328125, -0.65203857421875, -0.607666015625, -0.56329345703125, -0.5189208984375, -0.47454833984375, -0.43017578125, -0.38580322265625, -0.3414306640625, -0.29705810546875, -0.252685546875, -0.20831298828125, -0.1639404296875, -0.11956787109375, -0.0751953125, -0.03082275390625, 0.0135498046875, 0.05792236328125, 0.102294921875, 0.14666748046875, 0.1910400390625, 0.23541259765625, 0.27978515625, 0.32415771484375, 0.3685302734375, 0.41290283203125, 0.457275390625, 0.50164794921875, 0.5460205078125, 0.59039306640625, 0.634765625, 0.67913818359375, 0.7235107421875, 0.76788330078125, 0.812255859375, 0.85662841796875, 0.9010009765625, 0.94537353515625, 0.98974609375, 1.03411865234375, 1.0784912109375, 1.12286376953125, 1.167236328125, 1.21160888671875, 1.2559814453125, 1.30035400390625, 1.3447265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 6.0, 4.0, 5.0, 4.0, 5.0, 8.0, 14.0, 22.0, 25.0, 37.0, 58.0, 107.0, 154.0, 291.0, 490.0, 1049.0, 2151.0, 5176.0, 15101.0, 58055.0, 503586.0, 3390864.0, 167979.0, 32564.0, 9694.0, 3566.0, 1567.0, 742.0, 368.0, 226.0, 151.0, 81.0, 41.0, 23.0, 24.0, 11.0, 12.0, 10.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-4.203125, -4.090423583984375, -3.97772216796875, -3.865020751953125, -3.7523193359375, -3.639617919921875, -3.52691650390625, -3.414215087890625, -3.301513671875, -3.188812255859375, -3.07611083984375, -2.963409423828125, -2.8507080078125, -2.738006591796875, -2.62530517578125, -2.512603759765625, -2.39990234375, -2.287200927734375, -2.17449951171875, -2.061798095703125, -1.9490966796875, -1.836395263671875, -1.72369384765625, -1.610992431640625, -1.498291015625, -1.385589599609375, -1.27288818359375, -1.160186767578125, -1.0474853515625, -0.934783935546875, -0.82208251953125, -0.709381103515625, -0.5966796875, -0.483978271484375, -0.37127685546875, -0.258575439453125, -0.1458740234375, -0.033172607421875, 0.07952880859375, 0.192230224609375, 0.304931640625, 0.417633056640625, 0.53033447265625, 0.643035888671875, 0.7557373046875, 0.868438720703125, 0.98114013671875, 1.093841552734375, 1.20654296875, 1.319244384765625, 1.43194580078125, 1.544647216796875, 1.6573486328125, 1.770050048828125, 1.88275146484375, 1.995452880859375, 2.108154296875, 2.220855712890625, 2.33355712890625, 2.446258544921875, 2.5589599609375, 2.671661376953125, 2.78436279296875, 2.897064208984375, 3.009765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 14.0, 7.0, 16.0, 31.0, 34.0, 43.0, 71.0, 117.0, 188.0, 408.0, 846.0, 1104.0, 501.0, 215.0, 129.0, 85.0, 55.0, 37.0, 42.0, 23.0, 19.0, 11.0, 13.0, 11.0, 4.0, 5.0, 3.0, 6.0, 0.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.171875, -4.056671142578125, -3.94146728515625, -3.826263427734375, -3.7110595703125, -3.595855712890625, -3.48065185546875, -3.365447998046875, -3.250244140625, -3.135040283203125, -3.01983642578125, -2.904632568359375, -2.7894287109375, -2.674224853515625, -2.55902099609375, -2.443817138671875, -2.32861328125, -2.213409423828125, -2.09820556640625, -1.983001708984375, -1.8677978515625, -1.752593994140625, -1.63739013671875, -1.522186279296875, -1.406982421875, -1.291778564453125, -1.17657470703125, -1.061370849609375, -0.9461669921875, -0.830963134765625, -0.71575927734375, -0.600555419921875, -0.4853515625, -0.370147705078125, -0.25494384765625, -0.139739990234375, -0.0245361328125, 0.090667724609375, 0.20587158203125, 0.321075439453125, 0.436279296875, 0.551483154296875, 0.66668701171875, 0.781890869140625, 0.8970947265625, 1.012298583984375, 1.12750244140625, 1.242706298828125, 1.35791015625, 1.473114013671875, 1.58831787109375, 1.703521728515625, 1.8187255859375, 1.933929443359375, 2.04913330078125, 2.164337158203125, 2.279541015625, 2.394744873046875, 2.50994873046875, 2.625152587890625, 2.7403564453125, 2.855560302734375, 2.97076416015625, 3.085968017578125, 3.201171875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 18.0, 34.0, 58.0, 107.0, 173.0, 203.0, 149.0, 115.0, 55.0, 29.0, 18.0, 5.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.90979766845703, -41.7921257019043, -40.67445373535156, -39.55678176879883, -38.439109802246094, -37.321441650390625, -36.203765869140625, -35.086097717285156, -33.96842575073242, -32.85075378417969, -31.733081817626953, -30.61540985107422, -29.497739791870117, -28.380067825317383, -27.26239585876465, -26.144723892211914, -25.02705192565918, -23.909379959106445, -22.79170799255371, -21.67403793334961, -20.556365966796875, -19.43869400024414, -18.321022033691406, -17.203350067138672, -16.085678100585938, -14.968006134033203, -13.850335121154785, -12.73266315460205, -11.614992141723633, -10.497320175170898, -9.379648208618164, -8.26197624206543, -7.144306182861328, -6.026634693145752, -4.908963203430176, -3.7912912368774414, -2.6736197471618652, -1.555948257446289, -0.4382762908935547, 0.6793951988220215, 1.7970666885375977, 2.914738178253174, 4.03240966796875, 5.150081634521484, 6.2677531242370605, 7.385424613952637, 8.503096580505371, 9.620767593383789, 10.738439559936523, 11.856111526489258, 12.973782539367676, 14.09145450592041, 15.209125518798828, 16.326797485351562, 17.444469451904297, 18.56214141845703, 19.679813385009766, 20.7974853515625, 21.915157318115234, 23.03282928466797, 24.15049934387207, 25.268171310424805, 26.38584327697754, 27.503515243530273, 28.621185302734375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 7.0, 10.0, 8.0, 14.0, 7.0, 25.0, 13.0, 31.0, 27.0, 41.0, 39.0, 36.0, 46.0, 56.0, 40.0, 77.0, 52.0, 53.0, 46.0, 43.0, 47.0, 39.0, 30.0, 34.0, 26.0, 33.0, 26.0, 9.0, 12.0, 15.0, 9.0, 13.0, 11.0, 4.0, 2.0, 6.0, 4.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.761592864990234, -18.23255157470703, -17.70351219177246, -17.174470901489258, -16.645431518554688, -16.116390228271484, -15.587348937988281, -15.058308601379395, -14.529268264770508, -14.000227928161621, -13.471187591552734, -12.942146301269531, -12.413105964660645, -11.884065628051758, -11.355024337768555, -10.825984001159668, -10.296943664550781, -9.767903327941895, -9.238862991333008, -8.709821701049805, -8.180781364440918, -7.651741027832031, -7.122700214385986, -6.593659400939941, -6.064619064331055, -5.535578727722168, -5.006537914276123, -4.477497100830078, -3.9484567642211914, -3.4194161891937256, -2.8903756141662598, -2.361335039138794, -1.832296371459961, -1.3032557964324951, -0.7742152214050293, -0.24517464637756348, 0.28386592864990234, 0.8129065036773682, 1.341947078704834, 1.8709876537322998, 2.4000282287597656, 2.9290688037872314, 3.4581093788146973, 3.987149953842163, 4.516190528869629, 5.045230865478516, 5.5742716789245605, 6.1033124923706055, 6.632352828979492, 7.161393165588379, 7.690433979034424, 8.219474792480469, 8.748515129089355, 9.277555465698242, 9.806596755981445, 10.335637092590332, 10.864677429199219, 11.393717765808105, 11.922758102416992, 12.451799392700195, 12.980839729309082, 13.509880065917969, 14.038921356201172, 14.567961692810059, 15.097002029418945]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 4.0, 9.0, 13.0, 14.0, 39.0, 44.0, 57.0, 87.0, 136.0, 225.0, 372.0, 611.0, 1027.0, 1745.0, 2925.0, 5218.0, 10125.0, 20121.0, 41219.0, 86659.0, 171492.0, 259526.0, 215197.0, 117379.0, 57169.0, 27396.0, 13557.0, 7027.0, 3845.0, 2116.0, 1196.0, 734.0, 435.0, 279.0, 188.0, 119.0, 89.0, 60.0, 33.0, 22.0, 17.0, 4.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0], "bins": [-1.9013671875, -1.8509521484375, -1.800537109375, -1.7501220703125, -1.69970703125, -1.6492919921875, -1.598876953125, -1.5484619140625, -1.498046875, -1.4476318359375, -1.397216796875, -1.3468017578125, -1.29638671875, -1.2459716796875, -1.195556640625, -1.1451416015625, -1.0947265625, -1.0443115234375, -0.993896484375, -0.9434814453125, -0.89306640625, -0.8426513671875, -0.792236328125, -0.7418212890625, -0.69140625, -0.6409912109375, -0.590576171875, -0.5401611328125, -0.48974609375, -0.4393310546875, -0.388916015625, -0.3385009765625, -0.2880859375, -0.2376708984375, -0.187255859375, -0.1368408203125, -0.08642578125, -0.0360107421875, 0.014404296875, 0.0648193359375, 0.115234375, 0.1656494140625, 0.216064453125, 0.2664794921875, 0.31689453125, 0.3673095703125, 0.417724609375, 0.4681396484375, 0.5185546875, 0.5689697265625, 0.619384765625, 0.6697998046875, 0.72021484375, 0.7706298828125, 0.821044921875, 0.8714599609375, 0.921875, 0.9722900390625, 1.022705078125, 1.0731201171875, 1.12353515625, 1.1739501953125, 1.224365234375, 1.2747802734375, 1.3251953125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 2.0, 7.0, 11.0, 13.0, 23.0, 20.0, 24.0, 24.0, 22.0, 25.0, 50.0, 56.0, 42.0, 44.0, 46.0, 51.0, 46.0, 52.0, 46.0, 44.0, 50.0, 42.0, 33.0, 36.0, 36.0, 23.0, 23.0, 29.0, 13.0, 10.0, 16.0, 10.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0185546875, -0.983154296875, -0.94775390625, -0.912353515625, -0.876953125, -0.841552734375, -0.80615234375, -0.770751953125, -0.7353515625, -0.699951171875, -0.66455078125, -0.629150390625, -0.59375, -0.558349609375, -0.52294921875, -0.487548828125, -0.4521484375, -0.416748046875, -0.38134765625, -0.345947265625, -0.310546875, -0.275146484375, -0.23974609375, -0.204345703125, -0.1689453125, -0.133544921875, -0.09814453125, -0.062744140625, -0.02734375, 0.008056640625, 0.04345703125, 0.078857421875, 0.1142578125, 0.149658203125, 0.18505859375, 0.220458984375, 0.255859375, 0.291259765625, 0.32666015625, 0.362060546875, 0.3974609375, 0.432861328125, 0.46826171875, 0.503662109375, 0.5390625, 0.574462890625, 0.60986328125, 0.645263671875, 0.6806640625, 0.716064453125, 0.75146484375, 0.786865234375, 0.822265625, 0.857666015625, 0.89306640625, 0.928466796875, 0.9638671875, 0.999267578125, 1.03466796875, 1.070068359375, 1.10546875, 1.140869140625, 1.17626953125, 1.211669921875, 1.2470703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 9.0, 8.0, 14.0, 16.0, 43.0, 57.0, 97.0, 159.0, 232.0, 373.0, 622.0, 1161.0, 2628.0, 7727.0, 35589.0, 243117.0, 623211.0, 106751.0, 17871.0, 4677.0, 1900.0, 929.0, 529.0, 293.0, 192.0, 103.0, 75.0, 59.0, 38.0, 23.0, 13.0, 11.0, 6.0, 1.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.82421875, -4.701446533203125, -4.57867431640625, -4.455902099609375, -4.3331298828125, -4.210357666015625, -4.08758544921875, -3.964813232421875, -3.842041015625, -3.719268798828125, -3.59649658203125, -3.473724365234375, -3.3509521484375, -3.228179931640625, -3.10540771484375, -2.982635498046875, -2.85986328125, -2.737091064453125, -2.61431884765625, -2.491546630859375, -2.3687744140625, -2.246002197265625, -2.12322998046875, -2.000457763671875, -1.877685546875, -1.754913330078125, -1.63214111328125, -1.509368896484375, -1.3865966796875, -1.263824462890625, -1.14105224609375, -1.018280029296875, -0.8955078125, -0.772735595703125, -0.64996337890625, -0.527191162109375, -0.4044189453125, -0.281646728515625, -0.15887451171875, -0.036102294921875, 0.086669921875, 0.209442138671875, 0.33221435546875, 0.454986572265625, 0.5777587890625, 0.700531005859375, 0.82330322265625, 0.946075439453125, 1.06884765625, 1.191619873046875, 1.31439208984375, 1.437164306640625, 1.5599365234375, 1.682708740234375, 1.80548095703125, 1.928253173828125, 2.051025390625, 2.173797607421875, 2.29656982421875, 2.419342041015625, 2.5421142578125, 2.664886474609375, 2.78765869140625, 2.910430908203125, 3.033203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 12.0, 9.0, 15.0, 16.0, 20.0, 21.0, 33.0, 34.0, 34.0, 36.0, 48.0, 46.0, 65.0, 50.0, 53.0, 50.0, 60.0, 47.0, 59.0, 41.0, 40.0, 36.0, 30.0, 30.0, 22.0, 24.0, 13.0, 13.0, 5.0, 12.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.671875, -5.50421142578125, -5.3365478515625, -5.16888427734375, -5.001220703125, -4.83355712890625, -4.6658935546875, -4.49822998046875, -4.33056640625, -4.16290283203125, -3.9952392578125, -3.82757568359375, -3.659912109375, -3.49224853515625, -3.3245849609375, -3.15692138671875, -2.9892578125, -2.82159423828125, -2.6539306640625, -2.48626708984375, -2.318603515625, -2.15093994140625, -1.9832763671875, -1.81561279296875, -1.64794921875, -1.48028564453125, -1.3126220703125, -1.14495849609375, -0.977294921875, -0.80963134765625, -0.6419677734375, -0.47430419921875, -0.306640625, -0.13897705078125, 0.0286865234375, 0.19635009765625, 0.364013671875, 0.53167724609375, 0.6993408203125, 0.86700439453125, 1.03466796875, 1.20233154296875, 1.3699951171875, 1.53765869140625, 1.705322265625, 1.87298583984375, 2.0406494140625, 2.20831298828125, 2.3759765625, 2.54364013671875, 2.7113037109375, 2.87896728515625, 3.046630859375, 3.21429443359375, 3.3819580078125, 3.54962158203125, 3.71728515625, 3.88494873046875, 4.0526123046875, 4.22027587890625, 4.387939453125, 4.55560302734375, 4.7232666015625, 4.89093017578125, 5.05859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 10.0, 7.0, 16.0, 11.0, 22.0, 33.0, 57.0, 81.0, 154.0, 307.0, 710.0, 1911.0, 7896.0, 63118.0, 802604.0, 153452.0, 13506.0, 2884.0, 962.0, 365.0, 180.0, 99.0, 62.0, 31.0, 29.0, 19.0, 14.0, 6.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9207763671875, -1.851318359375, -1.7818603515625, -1.71240234375, -1.6429443359375, -1.573486328125, -1.5040283203125, -1.4345703125, -1.3651123046875, -1.295654296875, -1.2261962890625, -1.15673828125, -1.0872802734375, -1.017822265625, -0.9483642578125, -0.87890625, -0.8094482421875, -0.739990234375, -0.6705322265625, -0.60107421875, -0.5316162109375, -0.462158203125, -0.3927001953125, -0.3232421875, -0.2537841796875, -0.184326171875, -0.1148681640625, -0.04541015625, 0.0240478515625, 0.093505859375, 0.1629638671875, 0.232421875, 0.3018798828125, 0.371337890625, 0.4407958984375, 0.51025390625, 0.5797119140625, 0.649169921875, 0.7186279296875, 0.7880859375, 0.8575439453125, 0.927001953125, 0.9964599609375, 1.06591796875, 1.1353759765625, 1.204833984375, 1.2742919921875, 1.34375, 1.4132080078125, 1.482666015625, 1.5521240234375, 1.62158203125, 1.6910400390625, 1.760498046875, 1.8299560546875, 1.8994140625, 1.9688720703125, 2.038330078125, 2.1077880859375, 2.17724609375, 2.2467041015625, 2.316162109375, 2.3856201171875, 2.455078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 8.0, 16.0, 12.0, 27.0, 51.0, 64.0, 108.0, 128.0, 141.0, 130.0, 105.0, 63.0, 38.0, 33.0, 24.0, 10.0, 15.0, 6.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005822181701660156, -0.0005674064159393311, -0.0005525946617126465, -0.0005377829074859619, -0.0005229711532592773, -0.0005081593990325928, -0.0004933476448059082, -0.00047853589057922363, -0.00046372413635253906, -0.0004489123821258545, -0.0004341006278991699, -0.00041928887367248535, -0.0004044771194458008, -0.0003896653652191162, -0.00037485361099243164, -0.00036004185676574707, -0.0003452301025390625, -0.00033041834831237793, -0.00031560659408569336, -0.0003007948398590088, -0.0002859830856323242, -0.00027117133140563965, -0.0002563595771789551, -0.0002415478229522705, -0.00022673606872558594, -0.00021192431449890137, -0.0001971125602722168, -0.00018230080604553223, -0.00016748905181884766, -0.00015267729759216309, -0.00013786554336547852, -0.00012305378913879395, -0.00010824203491210938, -9.34302806854248e-05, -7.861852645874023e-05, -6.380677223205566e-05, -4.8995018005371094e-05, -3.4183263778686523e-05, -1.9371509552001953e-05, -4.559755325317383e-06, 1.0251998901367188e-05, 2.5063753128051758e-05, 3.987550735473633e-05, 5.46872615814209e-05, 6.949901580810547e-05, 8.431077003479004e-05, 9.912252426147461e-05, 0.00011393427848815918, 0.00012874603271484375, 0.00014355778694152832, 0.0001583695411682129, 0.00017318129539489746, 0.00018799304962158203, 0.0002028048038482666, 0.00021761655807495117, 0.00023242831230163574, 0.0002472400665283203, 0.0002620518207550049, 0.00027686357498168945, 0.000291675329208374, 0.0003064870834350586, 0.00032129883766174316, 0.00033611059188842773, 0.0003509223461151123, 0.0003657341003417969]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 9.0, 16.0, 12.0, 30.0, 44.0, 50.0, 115.0, 166.0, 295.0, 508.0, 1032.0, 2471.0, 7251.0, 33325.0, 305636.0, 616634.0, 63603.0, 11193.0, 3291.0, 1327.0, 677.0, 337.0, 202.0, 108.0, 73.0, 49.0, 26.0, 23.0, 11.0, 8.0, 5.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1523895263671875, -1.102630615234375, -1.0528717041015625, -1.00311279296875, -0.9533538818359375, -0.903594970703125, -0.8538360595703125, -0.8040771484375, -0.7543182373046875, -0.704559326171875, -0.6548004150390625, -0.60504150390625, -0.5552825927734375, -0.505523681640625, -0.4557647705078125, -0.406005859375, -0.3562469482421875, -0.306488037109375, -0.2567291259765625, -0.20697021484375, -0.1572113037109375, -0.107452392578125, -0.0576934814453125, -0.0079345703125, 0.0418243408203125, 0.091583251953125, 0.1413421630859375, 0.19110107421875, 0.2408599853515625, 0.290618896484375, 0.3403778076171875, 0.39013671875, 0.4398956298828125, 0.489654541015625, 0.5394134521484375, 0.58917236328125, 0.6389312744140625, 0.688690185546875, 0.7384490966796875, 0.7882080078125, 0.8379669189453125, 0.887725830078125, 0.9374847412109375, 0.98724365234375, 1.0370025634765625, 1.086761474609375, 1.1365203857421875, 1.186279296875, 1.2360382080078125, 1.285797119140625, 1.3355560302734375, 1.38531494140625, 1.4350738525390625, 1.484832763671875, 1.5345916748046875, 1.5843505859375, 1.6341094970703125, 1.683868408203125, 1.7336273193359375, 1.78338623046875, 1.8331451416015625, 1.882904052734375, 1.9326629638671875, 1.982421875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 4.0, 3.0, 3.0, 11.0, 27.0, 24.0, 45.0, 46.0, 71.0, 93.0, 126.0, 118.0, 110.0, 85.0, 73.0, 43.0, 36.0, 26.0, 16.0, 15.0, 7.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.03863525390625, -1.9718017578125, -1.90496826171875, -1.838134765625, -1.77130126953125, -1.7044677734375, -1.63763427734375, -1.57080078125, -1.50396728515625, -1.4371337890625, -1.37030029296875, -1.303466796875, -1.23663330078125, -1.1697998046875, -1.10296630859375, -1.0361328125, -0.96929931640625, -0.9024658203125, -0.83563232421875, -0.768798828125, -0.70196533203125, -0.6351318359375, -0.56829833984375, -0.50146484375, -0.43463134765625, -0.3677978515625, -0.30096435546875, -0.234130859375, -0.16729736328125, -0.1004638671875, -0.03363037109375, 0.033203125, 0.10003662109375, 0.1668701171875, 0.23370361328125, 0.300537109375, 0.36737060546875, 0.4342041015625, 0.50103759765625, 0.56787109375, 0.63470458984375, 0.7015380859375, 0.76837158203125, 0.835205078125, 0.90203857421875, 0.9688720703125, 1.03570556640625, 1.1025390625, 1.16937255859375, 1.2362060546875, 1.30303955078125, 1.369873046875, 1.43670654296875, 1.5035400390625, 1.57037353515625, 1.63720703125, 1.70404052734375, 1.7708740234375, 1.83770751953125, 1.904541015625, 1.97137451171875, 2.0382080078125, 2.10504150390625, 2.171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 20.0, 27.0, 108.0, 183.0, 302.0, 211.0, 91.0, 34.0, 15.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.68215942382812, -68.04549407958984, -66.40882110595703, -64.77215576171875, -63.13548278808594, -61.49881362915039, -59.862144470214844, -58.22547912597656, -56.58880615234375, -54.9521369934082, -53.315467834472656, -51.67879867553711, -50.04212951660156, -48.405460357666016, -46.76879119873047, -45.13212585449219, -43.49545669555664, -41.858787536621094, -40.22211837768555, -38.58544921875, -36.94878005981445, -35.312110900878906, -33.675445556640625, -32.03877258300781, -30.4021053314209, -28.76543617248535, -27.128767013549805, -25.49209976196289, -23.855430603027344, -22.218761444091797, -20.58209228515625, -18.945423126220703, -17.308757781982422, -15.672088623046875, -14.035419464111328, -12.398751258850098, -10.76208209991455, -9.125412940979004, -7.488744735717773, -5.852075576782227, -4.21540641784668, -2.578737497329712, -0.9420685768127441, 0.6946001052856445, 2.3312692642211914, 3.9679384231567383, 5.604606628417969, 7.241275787353516, 8.877944946289062, 10.51461410522461, 12.151283264160156, 13.787951469421387, 15.424620628356934, 17.061290740966797, 18.69795799255371, 20.334627151489258, 21.971296310424805, 23.60796546936035, 25.2446346282959, 26.881301879882812, 28.51797103881836, 30.154640197753906, 31.791309356689453, 33.427978515625, 35.06464767456055]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 6.0, 13.0, 13.0, 16.0, 20.0, 22.0, 33.0, 29.0, 52.0, 41.0, 51.0, 51.0, 64.0, 81.0, 81.0, 66.0, 68.0, 61.0, 43.0, 30.0, 35.0, 22.0, 22.0, 21.0, 17.0, 10.0, 8.0, 7.0, 1.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.02332305908203, -28.27657127380371, -27.52981948852539, -26.78306770324707, -26.03631591796875, -25.289566040039062, -24.542814254760742, -23.796062469482422, -23.0493106842041, -22.30255889892578, -21.55580711364746, -20.80905532836914, -20.062305450439453, -19.315553665161133, -18.568801879882812, -17.822050094604492, -17.075298309326172, -16.32854652404785, -15.581794738769531, -14.835043907165527, -14.088292121887207, -13.341540336608887, -12.594789505004883, -11.848037719726562, -11.101285934448242, -10.354534149169922, -9.607782363891602, -8.861031532287598, -8.114279747009277, -7.367527961730957, -6.620776653289795, -5.874025344848633, -5.1272735595703125, -4.380521774291992, -3.63377046585083, -2.887018918991089, -2.1402673721313477, -1.3935158252716064, -0.6467642784118652, 0.09998703002929688, 0.8467388153076172, 1.5934903621673584, 2.3402419090270996, 3.086993455886841, 3.833745002746582, 4.580496788024902, 5.3272480964660645, 6.073999404907227, 6.820751190185547, 7.567502975463867, 8.314254760742188, 9.061005592346191, 9.807757377624512, 10.554509162902832, 11.301259994506836, 12.048011779785156, 12.794763565063477, 13.541515350341797, 14.288267135620117, 15.035017967224121, 15.781769752502441, 16.528520584106445, 17.275272369384766, 18.022024154663086, 18.768775939941406]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 5.0, 9.0, 12.0, 25.0, 31.0, 40.0, 74.0, 105.0, 204.0, 504.0, 1642.0, 7166.0, 51631.0, 3670771.0, 436626.0, 19822.0, 3949.0, 969.0, 332.0, 120.0, 69.0, 58.0, 21.0, 31.0, 7.0, 8.0, 7.0, 4.0, 12.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.890625, -4.753936767578125, -4.61724853515625, -4.480560302734375, -4.3438720703125, -4.207183837890625, -4.07049560546875, -3.933807373046875, -3.797119140625, -3.660430908203125, -3.52374267578125, -3.387054443359375, -3.2503662109375, -3.113677978515625, -2.97698974609375, -2.840301513671875, -2.70361328125, -2.566925048828125, -2.43023681640625, -2.293548583984375, -2.1568603515625, -2.020172119140625, -1.88348388671875, -1.746795654296875, -1.610107421875, -1.473419189453125, -1.33673095703125, -1.200042724609375, -1.0633544921875, -0.926666259765625, -0.78997802734375, -0.653289794921875, -0.5166015625, -0.379913330078125, -0.24322509765625, -0.106536865234375, 0.0301513671875, 0.166839599609375, 0.30352783203125, 0.440216064453125, 0.576904296875, 0.713592529296875, 0.85028076171875, 0.986968994140625, 1.1236572265625, 1.260345458984375, 1.39703369140625, 1.533721923828125, 1.67041015625, 1.807098388671875, 1.94378662109375, 2.080474853515625, 2.2171630859375, 2.353851318359375, 2.49053955078125, 2.627227783203125, 2.763916015625, 2.900604248046875, 3.03729248046875, 3.173980712890625, 3.3106689453125, 3.447357177734375, 3.58404541015625, 3.720733642578125, 3.857421875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 9.0, 15.0, 17.0, 36.0, 57.0, 54.0, 76.0, 102.0, 103.0, 109.0, 98.0, 82.0, 80.0, 51.0, 45.0, 31.0, 21.0, 11.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.08984375, -3.0200958251953125, -2.950347900390625, -2.8805999755859375, -2.81085205078125, -2.7411041259765625, -2.671356201171875, -2.6016082763671875, -2.5318603515625, -2.4621124267578125, -2.392364501953125, -2.3226165771484375, -2.25286865234375, -2.1831207275390625, -2.113372802734375, -2.0436248779296875, -1.973876953125, -1.9041290283203125, -1.834381103515625, -1.7646331787109375, -1.69488525390625, -1.6251373291015625, -1.555389404296875, -1.4856414794921875, -1.4158935546875, -1.3461456298828125, -1.276397705078125, -1.2066497802734375, -1.13690185546875, -1.0671539306640625, -0.997406005859375, -0.9276580810546875, -0.85791015625, -0.7881622314453125, -0.718414306640625, -0.6486663818359375, -0.57891845703125, -0.5091705322265625, -0.439422607421875, -0.3696746826171875, -0.2999267578125, -0.2301788330078125, -0.160430908203125, -0.0906829833984375, -0.02093505859375, 0.0488128662109375, 0.118560791015625, 0.1883087158203125, 0.258056640625, 0.3278045654296875, 0.397552490234375, 0.4673004150390625, 0.53704833984375, 0.6067962646484375, 0.676544189453125, 0.7462921142578125, 0.8160400390625, 0.8857879638671875, 0.955535888671875, 1.0252838134765625, 1.09503173828125, 1.1647796630859375, 1.234527587890625, 1.3042755126953125, 1.3740234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 13.0, 19.0, 16.0, 36.0, 54.0, 102.0, 203.0, 372.0, 863.0, 1899.0, 4603.0, 12051.0, 35270.0, 153371.0, 2743889.0, 1107364.0, 93040.0, 25451.0, 8954.0, 3487.0, 1555.0, 765.0, 398.0, 222.0, 115.0, 65.0, 35.0, 31.0, 12.0, 8.0, 4.0, 4.0, 7.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.740234375, -2.656829833984375, -2.57342529296875, -2.490020751953125, -2.4066162109375, -2.323211669921875, -2.23980712890625, -2.156402587890625, -2.072998046875, -1.989593505859375, -1.90618896484375, -1.822784423828125, -1.7393798828125, -1.655975341796875, -1.57257080078125, -1.489166259765625, -1.40576171875, -1.322357177734375, -1.23895263671875, -1.155548095703125, -1.0721435546875, -0.988739013671875, -0.90533447265625, -0.821929931640625, -0.738525390625, -0.655120849609375, -0.57171630859375, -0.488311767578125, -0.4049072265625, -0.321502685546875, -0.23809814453125, -0.154693603515625, -0.0712890625, 0.012115478515625, 0.09552001953125, 0.178924560546875, 0.2623291015625, 0.345733642578125, 0.42913818359375, 0.512542724609375, 0.595947265625, 0.679351806640625, 0.76275634765625, 0.846160888671875, 0.9295654296875, 1.012969970703125, 1.09637451171875, 1.179779052734375, 1.26318359375, 1.346588134765625, 1.42999267578125, 1.513397216796875, 1.5968017578125, 1.680206298828125, 1.76361083984375, 1.847015380859375, 1.930419921875, 2.013824462890625, 2.09722900390625, 2.180633544921875, 2.2640380859375, 2.347442626953125, 2.43084716796875, 2.514251708984375, 2.59765625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 10.0, 5.0, 7.0, 4.0, 10.0, 15.0, 14.0, 19.0, 12.0, 35.0, 32.0, 67.0, 86.0, 137.0, 288.0, 529.0, 858.0, 783.0, 458.0, 237.0, 158.0, 88.0, 60.0, 28.0, 23.0, 27.0, 14.0, 24.0, 9.0, 3.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.01348876953125, -1.9293212890625, -1.84515380859375, -1.760986328125, -1.67681884765625, -1.5926513671875, -1.50848388671875, -1.42431640625, -1.34014892578125, -1.2559814453125, -1.17181396484375, -1.087646484375, -1.00347900390625, -0.9193115234375, -0.83514404296875, -0.7509765625, -0.66680908203125, -0.5826416015625, -0.49847412109375, -0.414306640625, -0.33013916015625, -0.2459716796875, -0.16180419921875, -0.07763671875, 0.00653076171875, 0.0906982421875, 0.17486572265625, 0.259033203125, 0.34320068359375, 0.4273681640625, 0.51153564453125, 0.595703125, 0.67987060546875, 0.7640380859375, 0.84820556640625, 0.932373046875, 1.01654052734375, 1.1007080078125, 1.18487548828125, 1.26904296875, 1.35321044921875, 1.4373779296875, 1.52154541015625, 1.605712890625, 1.68988037109375, 1.7740478515625, 1.85821533203125, 1.9423828125, 2.02655029296875, 2.1107177734375, 2.19488525390625, 2.279052734375, 2.36322021484375, 2.4473876953125, 2.53155517578125, 2.61572265625, 2.69989013671875, 2.7840576171875, 2.86822509765625, 2.952392578125, 3.03656005859375, 3.1207275390625, 3.20489501953125, 3.2890625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 14.0, 93.0, 186.0, 314.0, 224.0, 100.0, 34.0, 10.0, 8.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.85332489013672, -39.42203903198242, -37.990753173828125, -36.55946350097656, -35.128177642822266, -33.69689178466797, -32.26560592651367, -30.834320068359375, -29.403032302856445, -27.97174644470215, -26.54045867919922, -25.109172821044922, -23.677886962890625, -22.246599197387695, -20.8153133392334, -19.38402557373047, -17.952739715576172, -16.521453857421875, -15.090166091918945, -13.658880233764648, -12.227593421936035, -10.796306610107422, -9.365020751953125, -7.933733940124512, -6.502447128295898, -5.071160316467285, -3.63987398147583, -2.208587646484375, -0.7773008346557617, 0.6539859771728516, 2.0852718353271484, 3.5165586471557617, 4.947845458984375, 6.379132270812988, 7.810418605804443, 9.241704940795898, 10.672991752624512, 12.104278564453125, 13.535564422607422, 14.966851234436035, 16.39813804626465, 17.829423904418945, 19.260711669921875, 20.691997528076172, 22.12328338623047, 23.5545711517334, 24.985857009887695, 26.417144775390625, 27.848430633544922, 29.27971649169922, 30.71100425720215, 32.14228820800781, 33.573577880859375, 35.00486373901367, 36.43614959716797, 37.867435455322266, 39.29872131347656, 40.73000717163086, 42.161293029785156, 43.59258270263672, 45.023868560791016, 46.45515441894531, 47.88644027709961, 49.317726135253906, 50.74901580810547]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 7.0, 4.0, 2.0, 5.0, 10.0, 15.0, 12.0, 15.0, 24.0, 24.0, 24.0, 46.0, 30.0, 47.0, 55.0, 56.0, 48.0, 60.0, 62.0, 55.0, 58.0, 49.0, 47.0, 51.0, 33.0, 29.0, 32.0, 18.0, 25.0, 15.0, 13.0, 10.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.802183151245117, -14.299299240112305, -13.796415328979492, -13.29353141784668, -12.790647506713867, -12.287763595581055, -11.784880638122559, -11.281996726989746, -10.779112815856934, -10.276228904724121, -9.773344993591309, -9.270461082458496, -8.767578125, -8.264694213867188, -7.761810302734375, -7.2589263916015625, -6.75604248046875, -6.2531585693359375, -5.750274658203125, -5.247391223907471, -4.744507312774658, -4.241623401641846, -3.7387397289276123, -3.235856056213379, -2.7329721450805664, -2.230088233947754, -1.7272045612335205, -1.2243207693099976, -0.7214369773864746, -0.2185530662536621, 0.2843306064605713, 0.7872142791748047, 1.29010009765625, 1.792983889579773, 2.295867681503296, 2.7987513542175293, 3.301635265350342, 3.8045191764831543, 4.307402610778809, 4.810286521911621, 5.313170433044434, 5.816054344177246, 6.318938255310059, 6.821821689605713, 7.324705600738525, 7.827589511871338, 8.330472946166992, 8.833356857299805, 9.336240768432617, 9.83912467956543, 10.342008590698242, 10.844892501831055, 11.347776412963867, 11.85066032409668, 12.353543281555176, 12.856427192687988, 13.3593111038208, 13.862195014953613, 14.365078926086426, 14.867962837219238, 15.370845794677734, 15.873729705810547, 16.37661361694336, 16.879497528076172, 17.382381439208984]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 0.0, 6.0, 5.0, 9.0, 9.0, 15.0, 24.0, 47.0, 70.0, 130.0, 190.0, 298.0, 532.0, 945.0, 1740.0, 3162.0, 6097.0, 12525.0, 26576.0, 59283.0, 135082.0, 275526.0, 277093.0, 136126.0, 59832.0, 27211.0, 12598.0, 6323.0, 3127.0, 1728.0, 945.0, 535.0, 294.0, 180.0, 104.0, 59.0, 40.0, 36.0, 13.0, 8.0, 12.0, 9.0, 2.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.828125, -1.7691650390625, -1.710205078125, -1.6512451171875, -1.59228515625, -1.5333251953125, -1.474365234375, -1.4154052734375, -1.3564453125, -1.2974853515625, -1.238525390625, -1.1795654296875, -1.12060546875, -1.0616455078125, -1.002685546875, -0.9437255859375, -0.884765625, -0.8258056640625, -0.766845703125, -0.7078857421875, -0.64892578125, -0.5899658203125, -0.531005859375, -0.4720458984375, -0.4130859375, -0.3541259765625, -0.295166015625, -0.2362060546875, -0.17724609375, -0.1182861328125, -0.059326171875, -0.0003662109375, 0.05859375, 0.1175537109375, 0.176513671875, 0.2354736328125, 0.29443359375, 0.3533935546875, 0.412353515625, 0.4713134765625, 0.5302734375, 0.5892333984375, 0.648193359375, 0.7071533203125, 0.76611328125, 0.8250732421875, 0.884033203125, 0.9429931640625, 1.001953125, 1.0609130859375, 1.119873046875, 1.1788330078125, 1.23779296875, 1.2967529296875, 1.355712890625, 1.4146728515625, 1.4736328125, 1.5325927734375, 1.591552734375, 1.6505126953125, 1.70947265625, 1.7684326171875, 1.827392578125, 1.8863525390625, 1.9453125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 15.0, 19.0, 25.0, 28.0, 31.0, 40.0, 52.0, 55.0, 65.0, 83.0, 62.0, 71.0, 75.0, 70.0, 49.0, 61.0, 38.0, 31.0, 30.0, 25.0, 24.0, 22.0, 10.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.515625, -1.465087890625, -1.41455078125, -1.364013671875, -1.3134765625, -1.262939453125, -1.21240234375, -1.161865234375, -1.111328125, -1.060791015625, -1.01025390625, -0.959716796875, -0.9091796875, -0.858642578125, -0.80810546875, -0.757568359375, -0.70703125, -0.656494140625, -0.60595703125, -0.555419921875, -0.5048828125, -0.454345703125, -0.40380859375, -0.353271484375, -0.302734375, -0.252197265625, -0.20166015625, -0.151123046875, -0.1005859375, -0.050048828125, 0.00048828125, 0.051025390625, 0.1015625, 0.152099609375, 0.20263671875, 0.253173828125, 0.3037109375, 0.354248046875, 0.40478515625, 0.455322265625, 0.505859375, 0.556396484375, 0.60693359375, 0.657470703125, 0.7080078125, 0.758544921875, 0.80908203125, 0.859619140625, 0.91015625, 0.960693359375, 1.01123046875, 1.061767578125, 1.1123046875, 1.162841796875, 1.21337890625, 1.263916015625, 1.314453125, 1.364990234375, 1.41552734375, 1.466064453125, 1.5166015625, 1.567138671875, 1.61767578125, 1.668212890625, 1.71875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 7.0, 14.0, 13.0, 25.0, 13.0, 32.0, 54.0, 62.0, 117.0, 136.0, 238.0, 430.0, 743.0, 1473.0, 3575.0, 11269.0, 45617.0, 236241.0, 583365.0, 126492.0, 26365.0, 7127.0, 2532.0, 1137.0, 589.0, 302.0, 187.0, 120.0, 71.0, 55.0, 31.0, 26.0, 14.0, 15.0, 13.0, 13.0, 3.0, 7.0, 8.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.62109375, -3.505462646484375, -3.38983154296875, -3.274200439453125, -3.1585693359375, -3.042938232421875, -2.92730712890625, -2.811676025390625, -2.696044921875, -2.580413818359375, -2.46478271484375, -2.349151611328125, -2.2335205078125, -2.117889404296875, -2.00225830078125, -1.886627197265625, -1.77099609375, -1.655364990234375, -1.53973388671875, -1.424102783203125, -1.3084716796875, -1.192840576171875, -1.07720947265625, -0.961578369140625, -0.845947265625, -0.730316162109375, -0.61468505859375, -0.499053955078125, -0.3834228515625, -0.267791748046875, -0.15216064453125, -0.036529541015625, 0.0791015625, 0.194732666015625, 0.31036376953125, 0.425994873046875, 0.5416259765625, 0.657257080078125, 0.77288818359375, 0.888519287109375, 1.004150390625, 1.119781494140625, 1.23541259765625, 1.351043701171875, 1.4666748046875, 1.582305908203125, 1.69793701171875, 1.813568115234375, 1.92919921875, 2.044830322265625, 2.16046142578125, 2.276092529296875, 2.3917236328125, 2.507354736328125, 2.62298583984375, 2.738616943359375, 2.854248046875, 2.969879150390625, 3.08551025390625, 3.201141357421875, 3.3167724609375, 3.432403564453125, 3.54803466796875, 3.663665771484375, 3.779296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 4.0, 8.0, 13.0, 13.0, 16.0, 19.0, 23.0, 42.0, 25.0, 36.0, 44.0, 46.0, 52.0, 46.0, 52.0, 60.0, 52.0, 57.0, 53.0, 56.0, 40.0, 46.0, 39.0, 30.0, 27.0, 20.0, 12.0, 15.0, 13.0, 12.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8125, -4.646484375, -4.48046875, -4.314453125, -4.1484375, -3.982421875, -3.81640625, -3.650390625, -3.484375, -3.318359375, -3.15234375, -2.986328125, -2.8203125, -2.654296875, -2.48828125, -2.322265625, -2.15625, -1.990234375, -1.82421875, -1.658203125, -1.4921875, -1.326171875, -1.16015625, -0.994140625, -0.828125, -0.662109375, -0.49609375, -0.330078125, -0.1640625, 0.001953125, 0.16796875, 0.333984375, 0.5, 0.666015625, 0.83203125, 0.998046875, 1.1640625, 1.330078125, 1.49609375, 1.662109375, 1.828125, 1.994140625, 2.16015625, 2.326171875, 2.4921875, 2.658203125, 2.82421875, 2.990234375, 3.15625, 3.322265625, 3.48828125, 3.654296875, 3.8203125, 3.986328125, 4.15234375, 4.318359375, 4.484375, 4.650390625, 4.81640625, 4.982421875, 5.1484375, 5.314453125, 5.48046875, 5.646484375, 5.8125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 6.0, 9.0, 7.0, 6.0, 7.0, 28.0, 32.0, 42.0, 66.0, 128.0, 269.0, 565.0, 1528.0, 5034.0, 31448.0, 666628.0, 317664.0, 19111.0, 3725.0, 1185.0, 523.0, 210.0, 126.0, 72.0, 34.0, 32.0, 14.0, 11.0, 9.0, 8.0, 7.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94921875, -2.86468505859375, -2.7801513671875, -2.69561767578125, -2.611083984375, -2.52655029296875, -2.4420166015625, -2.35748291015625, -2.27294921875, -2.18841552734375, -2.1038818359375, -2.01934814453125, -1.934814453125, -1.85028076171875, -1.7657470703125, -1.68121337890625, -1.5966796875, -1.51214599609375, -1.4276123046875, -1.34307861328125, -1.258544921875, -1.17401123046875, -1.0894775390625, -1.00494384765625, -0.92041015625, -0.83587646484375, -0.7513427734375, -0.66680908203125, -0.582275390625, -0.49774169921875, -0.4132080078125, -0.32867431640625, -0.244140625, -0.15960693359375, -0.0750732421875, 0.00946044921875, 0.093994140625, 0.17852783203125, 0.2630615234375, 0.34759521484375, 0.43212890625, 0.51666259765625, 0.6011962890625, 0.68572998046875, 0.770263671875, 0.85479736328125, 0.9393310546875, 1.02386474609375, 1.1083984375, 1.19293212890625, 1.2774658203125, 1.36199951171875, 1.446533203125, 1.53106689453125, 1.6156005859375, 1.70013427734375, 1.78466796875, 1.86920166015625, 1.9537353515625, 2.03826904296875, 2.122802734375, 2.20733642578125, 2.2918701171875, 2.37640380859375, 2.4609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 5.0, 3.0, 6.0, 13.0, 20.0, 19.0, 17.0, 61.0, 59.0, 75.0, 92.0, 106.0, 117.0, 94.0, 78.0, 59.0, 40.0, 44.0, 18.0, 14.0, 13.0, 7.0, 5.0, 11.0, 3.0, 3.0, 8.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00039124488830566406, -0.0003782697021961212, -0.00036529451608657837, -0.0003523193299770355, -0.0003393441438674927, -0.00032636895775794983, -0.000313393771648407, -0.00030041858553886414, -0.0002874433994293213, -0.00027446821331977844, -0.0002614930272102356, -0.00024851784110069275, -0.0002355426549911499, -0.00022256746888160706, -0.0002095922827720642, -0.00019661709666252136, -0.00018364191055297852, -0.00017066672444343567, -0.00015769153833389282, -0.00014471635222434998, -0.00013174116611480713, -0.00011876598000526428, -0.00010579079389572144, -9.281560778617859e-05, -7.984042167663574e-05, -6.68652355670929e-05, -5.389004945755005e-05, -4.09148633480072e-05, -2.7939677238464355e-05, -1.4964491128921509e-05, -1.989305019378662e-06, 1.0985881090164185e-05, 2.396106719970703e-05, 3.693625330924988e-05, 4.9911439418792725e-05, 6.288662552833557e-05, 7.586181163787842e-05, 8.883699774742126e-05, 0.00010181218385696411, 0.00011478736996650696, 0.0001277625560760498, 0.00014073774218559265, 0.0001537129282951355, 0.00016668811440467834, 0.0001796633005142212, 0.00019263848662376404, 0.00020561367273330688, 0.00021858885884284973, 0.00023156404495239258, 0.0002445392310619354, 0.00025751441717147827, 0.0002704896032810211, 0.00028346478939056396, 0.0002964399755001068, 0.00030941516160964966, 0.0003223903477191925, 0.00033536553382873535, 0.0003483407199382782, 0.00036131590604782104, 0.0003742910921573639, 0.00038726627826690674, 0.0004002414643764496, 0.00041321665048599243, 0.0004261918365955353, 0.0004391670227050781]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 11.0, 16.0, 21.0, 30.0, 55.0, 75.0, 153.0, 271.0, 595.0, 1427.0, 4605.0, 24619.0, 282303.0, 668993.0, 54128.0, 7587.0, 2047.0, 814.0, 353.0, 162.0, 102.0, 67.0, 38.0, 22.0, 15.0, 11.0, 7.0, 6.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.115234375, -2.051483154296875, -1.98773193359375, -1.923980712890625, -1.8602294921875, -1.796478271484375, -1.73272705078125, -1.668975830078125, -1.605224609375, -1.541473388671875, -1.47772216796875, -1.413970947265625, -1.3502197265625, -1.286468505859375, -1.22271728515625, -1.158966064453125, -1.09521484375, -1.031463623046875, -0.96771240234375, -0.903961181640625, -0.8402099609375, -0.776458740234375, -0.71270751953125, -0.648956298828125, -0.585205078125, -0.521453857421875, -0.45770263671875, -0.393951416015625, -0.3302001953125, -0.266448974609375, -0.20269775390625, -0.138946533203125, -0.0751953125, -0.011444091796875, 0.05230712890625, 0.116058349609375, 0.1798095703125, 0.243560791015625, 0.30731201171875, 0.371063232421875, 0.434814453125, 0.498565673828125, 0.56231689453125, 0.626068115234375, 0.6898193359375, 0.753570556640625, 0.81732177734375, 0.881072998046875, 0.94482421875, 1.008575439453125, 1.07232666015625, 1.136077880859375, 1.1998291015625, 1.263580322265625, 1.32733154296875, 1.391082763671875, 1.454833984375, 1.518585205078125, 1.58233642578125, 1.646087646484375, 1.7098388671875, 1.773590087890625, 1.83734130859375, 1.901092529296875, 1.96484375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 6.0, 6.0, 8.0, 21.0, 25.0, 26.0, 30.0, 37.0, 56.0, 61.0, 69.0, 79.0, 80.0, 88.0, 73.0, 80.0, 63.0, 45.0, 35.0, 26.0, 22.0, 18.0, 10.0, 13.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7666015625, -1.7126007080078125, -1.658599853515625, -1.6045989990234375, -1.55059814453125, -1.4965972900390625, -1.442596435546875, -1.3885955810546875, -1.3345947265625, -1.2805938720703125, -1.226593017578125, -1.1725921630859375, -1.11859130859375, -1.0645904541015625, -1.010589599609375, -0.9565887451171875, -0.902587890625, -0.8485870361328125, -0.794586181640625, -0.7405853271484375, -0.68658447265625, -0.6325836181640625, -0.578582763671875, -0.5245819091796875, -0.4705810546875, -0.4165802001953125, -0.362579345703125, -0.3085784912109375, -0.25457763671875, -0.2005767822265625, -0.146575927734375, -0.0925750732421875, -0.03857421875, 0.0154266357421875, 0.069427490234375, 0.1234283447265625, 0.17742919921875, 0.2314300537109375, 0.285430908203125, 0.3394317626953125, 0.3934326171875, 0.4474334716796875, 0.501434326171875, 0.5554351806640625, 0.60943603515625, 0.6634368896484375, 0.717437744140625, 0.7714385986328125, 0.825439453125, 0.8794403076171875, 0.933441162109375, 0.9874420166015625, 1.04144287109375, 1.0954437255859375, 1.149444580078125, 1.2034454345703125, 1.2574462890625, 1.3114471435546875, 1.365447998046875, 1.4194488525390625, 1.47344970703125, 1.5274505615234375, 1.581451416015625, 1.6354522705078125, 1.689453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 19.0, 45.0, 112.0, 216.0, 265.0, 172.0, 85.0, 35.0, 21.0, 6.0, 6.0, 5.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.83061981201172, -35.3729133605957, -33.91520690917969, -32.45750427246094, -30.999797821044922, -29.542091369628906, -28.084386825561523, -26.62668228149414, -25.168975830078125, -23.71126937866211, -22.253564834594727, -20.795860290527344, -19.338153839111328, -17.880447387695312, -16.42274284362793, -14.96503734588623, -13.507331848144531, -12.049626350402832, -10.591920852661133, -9.134215354919434, -7.676509857177734, -6.218804359436035, -4.761098861694336, -3.3033933639526367, -1.8456878662109375, -0.3879823684692383, 1.069723129272461, 2.52742862701416, 3.9851341247558594, 5.442839622497559, 6.900545120239258, 8.358250617980957, 9.815959930419922, 11.273665428161621, 12.73137092590332, 14.18907642364502, 15.646781921386719, 17.104488372802734, 18.562192916870117, 20.0198974609375, 21.477603912353516, 22.93531036376953, 24.393014907836914, 25.850719451904297, 27.308425903320312, 28.766132354736328, 30.22383689880371, 31.681541442871094, 33.13924789428711, 34.596954345703125, 36.054656982421875, 37.51236343383789, 38.970069885253906, 40.42777633666992, 41.88548278808594, 43.34318542480469, 44.8008918762207, 46.25859832763672, 47.71630096435547, 49.174007415771484, 50.6317138671875, 52.089420318603516, 53.54712677001953, 55.00482940673828, 56.4625358581543]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 6.0, 14.0, 14.0, 23.0, 30.0, 27.0, 32.0, 46.0, 43.0, 56.0, 50.0, 64.0, 79.0, 88.0, 75.0, 61.0, 52.0, 54.0, 33.0, 37.0, 30.0, 16.0, 14.0, 14.0, 10.0, 8.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.305660247802734, -35.44225311279297, -34.5788459777832, -33.71543502807617, -32.852027893066406, -31.98862075805664, -31.125213623046875, -30.261804580688477, -29.398395538330078, -28.534988403320312, -27.671579360961914, -26.80817222595215, -25.94476318359375, -25.081356048583984, -24.21794891357422, -23.35453987121582, -22.491132736206055, -21.62772560119629, -20.76431655883789, -19.900909423828125, -19.037500381469727, -18.17409324645996, -17.310684204101562, -16.447277069091797, -15.583868980407715, -14.720460891723633, -13.85705280303955, -12.993644714355469, -12.130237579345703, -11.266828536987305, -10.403421401977539, -9.540013313293457, -8.676603317260742, -7.81319522857666, -6.949787139892578, -6.086379528045654, -5.222971439361572, -4.35956335067749, -3.4961557388305664, -2.6327476501464844, -1.7693395614624023, -0.9059315919876099, -0.04252362251281738, 0.8208842277526855, 1.6842923164367676, 2.5477004051208496, 3.4111080169677734, 4.2745161056518555, 5.1379241943359375, 6.0013322830200195, 6.864740371704102, 7.728147983551025, 8.591556549072266, 9.454963684082031, 10.318371772766113, 11.181779861450195, 12.045187950134277, 12.90859603881836, 13.772004127502441, 14.635412216186523, 15.498819351196289, 16.362228393554688, 17.225635528564453, 18.08904266357422, 18.952451705932617]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 5.0, 12.0, 16.0, 16.0, 25.0, 47.0, 47.0, 106.0, 224.0, 413.0, 902.0, 2046.0, 5131.0, 14957.0, 56694.0, 404992.0, 2827975.0, 760279.0, 86581.0, 21477.0, 7269.0, 2852.0, 1193.0, 525.0, 240.0, 112.0, 58.0, 38.0, 8.0, 15.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2734375, -2.216064453125, -2.15869140625, -2.101318359375, -2.0439453125, -1.986572265625, -1.92919921875, -1.871826171875, -1.814453125, -1.757080078125, -1.69970703125, -1.642333984375, -1.5849609375, -1.527587890625, -1.47021484375, -1.412841796875, -1.35546875, -1.298095703125, -1.24072265625, -1.183349609375, -1.1259765625, -1.068603515625, -1.01123046875, -0.953857421875, -0.896484375, -0.839111328125, -0.78173828125, -0.724365234375, -0.6669921875, -0.609619140625, -0.55224609375, -0.494873046875, -0.4375, -0.380126953125, -0.32275390625, -0.265380859375, -0.2080078125, -0.150634765625, -0.09326171875, -0.035888671875, 0.021484375, 0.078857421875, 0.13623046875, 0.193603515625, 0.2509765625, 0.308349609375, 0.36572265625, 0.423095703125, 0.48046875, 0.537841796875, 0.59521484375, 0.652587890625, 0.7099609375, 0.767333984375, 0.82470703125, 0.882080078125, 0.939453125, 0.996826171875, 1.05419921875, 1.111572265625, 1.1689453125, 1.226318359375, 1.28369140625, 1.341064453125, 1.3984375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 9.0, 19.0, 23.0, 34.0, 34.0, 66.0, 59.0, 97.0, 85.0, 89.0, 93.0, 99.0, 77.0, 74.0, 49.0, 41.0, 22.0, 20.0, 11.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.11328125, -3.0492782592773438, -2.9852752685546875, -2.9212722778320312, -2.857269287109375, -2.7932662963867188, -2.7292633056640625, -2.6652603149414062, -2.60125732421875, -2.5372543334960938, -2.4732513427734375, -2.4092483520507812, -2.345245361328125, -2.2812423706054688, -2.2172393798828125, -2.1532363891601562, -2.0892333984375, -2.0252304077148438, -1.9612274169921875, -1.8972244262695312, -1.833221435546875, -1.7692184448242188, -1.7052154541015625, -1.6412124633789062, -1.57720947265625, -1.5132064819335938, -1.4492034912109375, -1.3852005004882812, -1.321197509765625, -1.2571945190429688, -1.1931915283203125, -1.1291885375976562, -1.065185546875, -1.0011825561523438, -0.9371795654296875, -0.8731765747070312, -0.809173583984375, -0.7451705932617188, -0.6811676025390625, -0.6171646118164062, -0.55316162109375, -0.48915863037109375, -0.4251556396484375, -0.36115264892578125, -0.297149658203125, -0.23314666748046875, -0.1691436767578125, -0.10514068603515625, -0.0411376953125, 0.02286529541015625, 0.0868682861328125, 0.15087127685546875, 0.214874267578125, 0.27887725830078125, 0.3428802490234375, 0.40688323974609375, 0.47088623046875, 0.5348892211914062, 0.5988922119140625, 0.6628952026367188, 0.726898193359375, 0.7909011840820312, 0.8549041748046875, 0.9189071655273438, 0.98291015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 17.0, 12.0, 20.0, 24.0, 28.0, 54.0, 92.0, 156.0, 272.0, 488.0, 1014.0, 2345.0, 6415.0, 20541.0, 94655.0, 1299692.0, 2568616.0, 153942.0, 30748.0, 9033.0, 3234.0, 1338.0, 645.0, 337.0, 205.0, 110.0, 60.0, 46.0, 39.0, 31.0, 14.0, 15.0, 6.0, 6.0, 10.0, 6.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.578125, -2.48956298828125, -2.4010009765625, -2.31243896484375, -2.223876953125, -2.13531494140625, -2.0467529296875, -1.95819091796875, -1.86962890625, -1.78106689453125, -1.6925048828125, -1.60394287109375, -1.515380859375, -1.42681884765625, -1.3382568359375, -1.24969482421875, -1.1611328125, -1.07257080078125, -0.9840087890625, -0.89544677734375, -0.806884765625, -0.71832275390625, -0.6297607421875, -0.54119873046875, -0.45263671875, -0.36407470703125, -0.2755126953125, -0.18695068359375, -0.098388671875, -0.00982666015625, 0.0787353515625, 0.16729736328125, 0.255859375, 0.34442138671875, 0.4329833984375, 0.52154541015625, 0.610107421875, 0.69866943359375, 0.7872314453125, 0.87579345703125, 0.96435546875, 1.05291748046875, 1.1414794921875, 1.23004150390625, 1.318603515625, 1.40716552734375, 1.4957275390625, 1.58428955078125, 1.6728515625, 1.76141357421875, 1.8499755859375, 1.93853759765625, 2.027099609375, 2.11566162109375, 2.2042236328125, 2.29278564453125, 2.38134765625, 2.46990966796875, 2.5584716796875, 2.64703369140625, 2.735595703125, 2.82415771484375, 2.9127197265625, 3.00128173828125, 3.08984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 2.0, 6.0, 5.0, 5.0, 8.0, 18.0, 20.0, 21.0, 34.0, 47.0, 64.0, 105.0, 206.0, 321.0, 553.0, 825.0, 678.0, 404.0, 246.0, 130.0, 97.0, 63.0, 61.0, 42.0, 25.0, 19.0, 17.0, 10.0, 11.0, 7.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.2421875, -3.14324951171875, -3.0443115234375, -2.94537353515625, -2.846435546875, -2.74749755859375, -2.6485595703125, -2.54962158203125, -2.45068359375, -2.35174560546875, -2.2528076171875, -2.15386962890625, -2.054931640625, -1.95599365234375, -1.8570556640625, -1.75811767578125, -1.6591796875, -1.56024169921875, -1.4613037109375, -1.36236572265625, -1.263427734375, -1.16448974609375, -1.0655517578125, -0.96661376953125, -0.86767578125, -0.76873779296875, -0.6697998046875, -0.57086181640625, -0.471923828125, -0.37298583984375, -0.2740478515625, -0.17510986328125, -0.076171875, 0.02276611328125, 0.1217041015625, 0.22064208984375, 0.319580078125, 0.41851806640625, 0.5174560546875, 0.61639404296875, 0.71533203125, 0.81427001953125, 0.9132080078125, 1.01214599609375, 1.111083984375, 1.21002197265625, 1.3089599609375, 1.40789794921875, 1.5068359375, 1.60577392578125, 1.7047119140625, 1.80364990234375, 1.902587890625, 2.00152587890625, 2.1004638671875, 2.19940185546875, 2.29833984375, 2.39727783203125, 2.4962158203125, 2.59515380859375, 2.694091796875, 2.79302978515625, 2.8919677734375, 2.99090576171875, 3.08984375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 17.0, 38.0, 90.0, 217.0, 273.0, 204.0, 87.0, 39.0, 16.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.38591766357422, -22.97064208984375, -21.55536651611328, -20.140090942382812, -18.724817276000977, -17.309541702270508, -15.894266128540039, -14.478991508483887, -13.063715934753418, -11.64844036102295, -10.233165740966797, -8.817890167236328, -7.402615070343018, -5.987339973449707, -4.572064399719238, -3.156789779663086, -1.7415142059326172, -0.3262389898300171, 1.089036226272583, 2.5043115615844727, 3.919586658477783, 5.334861755371094, 6.7501373291015625, 8.165411949157715, 9.580687522888184, 10.995963096618652, 12.411237716674805, 13.826513290405273, 15.241788864135742, 16.657062530517578, 18.072338104248047, 19.487613677978516, 20.902889251708984, 22.318164825439453, 23.733440399169922, 25.14871597290039, 26.563989639282227, 27.979265213012695, 29.394540786743164, 30.809814453125, 32.22509002685547, 33.64036560058594, 35.055641174316406, 36.470916748046875, 37.886192321777344, 39.30146789550781, 40.71674346923828, 42.132015228271484, 43.54729461669922, 44.96257019042969, 46.377845764160156, 47.793121337890625, 49.208396911621094, 50.62367248535156, 52.03894805908203, 53.454219818115234, 54.8694953918457, 56.28477096557617, 57.70004653930664, 59.11532211303711, 60.53059768676758, 61.94586944580078, 63.36114501953125, 64.77642059326172, 66.19169616699219]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 10.0, 8.0, 11.0, 12.0, 8.0, 21.0, 22.0, 25.0, 25.0, 32.0, 30.0, 26.0, 39.0, 46.0, 47.0, 43.0, 49.0, 47.0, 45.0, 63.0, 52.0, 41.0, 41.0, 30.0, 28.0, 24.0, 20.0, 30.0, 20.0, 21.0, 13.0, 21.0, 11.0, 6.0, 6.0, 10.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.254129409790039, -13.804848670959473, -13.355567932128906, -12.90628719329834, -12.457006454467773, -12.00772476196289, -11.558444023132324, -11.109163284301758, -10.659882545471191, -10.210601806640625, -9.761321067810059, -9.312040328979492, -8.86275863647461, -8.41347885131836, -7.964197158813477, -7.51491641998291, -7.065635681152344, -6.616354942321777, -6.167074203491211, -5.717792987823486, -5.26851224899292, -4.8192315101623535, -4.369950294494629, -3.9206695556640625, -3.471388816833496, -3.0221080780029297, -2.572827100753784, -2.1235461235046387, -1.6742653846740723, -1.2249846458435059, -0.7757036685943604, -0.32642269134521484, 0.12285804748535156, 0.5721389055252075, 1.0214197635650635, 1.4707006216049194, 1.9199814796447754, 2.369262218475342, 2.8185431957244873, 3.267824172973633, 3.717104911804199, 4.166385650634766, 4.615666389465332, 5.064947605133057, 5.514228343963623, 5.9635090827941895, 6.412790298461914, 6.8620710372924805, 7.311351776123047, 7.760632514953613, 8.20991325378418, 8.659193992614746, 9.108474731445312, 9.557756423950195, 10.007037162780762, 10.456317901611328, 10.905598640441895, 11.354879379272461, 11.804160118103027, 12.253440856933594, 12.702722549438477, 13.152002334594727, 13.60128402709961, 14.050564765930176, 14.499845504760742]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 10.0, 7.0, 12.0, 31.0, 28.0, 45.0, 71.0, 152.0, 261.0, 457.0, 965.0, 1932.0, 4115.0, 9190.0, 21442.0, 49233.0, 110050.0, 214552.0, 276413.0, 191381.0, 93646.0, 41402.0, 18134.0, 7990.0, 3547.0, 1696.0, 754.0, 443.0, 225.0, 142.0, 82.0, 44.0, 28.0, 30.0, 26.0, 10.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8544921875, -1.8035430908203125, -1.752593994140625, -1.7016448974609375, -1.65069580078125, -1.5997467041015625, -1.548797607421875, -1.4978485107421875, -1.4468994140625, -1.3959503173828125, -1.345001220703125, -1.2940521240234375, -1.24310302734375, -1.1921539306640625, -1.141204833984375, -1.0902557373046875, -1.039306640625, -0.9883575439453125, -0.937408447265625, -0.8864593505859375, -0.83551025390625, -0.7845611572265625, -0.733612060546875, -0.6826629638671875, -0.6317138671875, -0.5807647705078125, -0.529815673828125, -0.4788665771484375, -0.42791748046875, -0.3769683837890625, -0.326019287109375, -0.2750701904296875, -0.22412109375, -0.1731719970703125, -0.122222900390625, -0.0712738037109375, -0.02032470703125, 0.0306243896484375, 0.081573486328125, 0.1325225830078125, 0.1834716796875, 0.2344207763671875, 0.285369873046875, 0.3363189697265625, 0.38726806640625, 0.4382171630859375, 0.489166259765625, 0.5401153564453125, 0.591064453125, 0.6420135498046875, 0.692962646484375, 0.7439117431640625, 0.79486083984375, 0.8458099365234375, 0.896759033203125, 0.9477081298828125, 0.9986572265625, 1.0496063232421875, 1.100555419921875, 1.1515045166015625, 1.20245361328125, 1.2534027099609375, 1.304351806640625, 1.3553009033203125, 1.40625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 4.0, 9.0, 18.0, 10.0, 14.0, 27.0, 30.0, 32.0, 37.0, 55.0, 55.0, 54.0, 65.0, 61.0, 51.0, 42.0, 58.0, 52.0, 47.0, 51.0, 46.0, 30.0, 32.0, 34.0, 27.0, 18.0, 10.0, 9.0, 9.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.7373046875, -1.6965789794921875, -1.655853271484375, -1.6151275634765625, -1.57440185546875, -1.5336761474609375, -1.492950439453125, -1.4522247314453125, -1.4114990234375, -1.3707733154296875, -1.330047607421875, -1.2893218994140625, -1.24859619140625, -1.2078704833984375, -1.167144775390625, -1.1264190673828125, -1.085693359375, -1.0449676513671875, -1.004241943359375, -0.9635162353515625, -0.92279052734375, -0.8820648193359375, -0.841339111328125, -0.8006134033203125, -0.7598876953125, -0.7191619873046875, -0.678436279296875, -0.6377105712890625, -0.59698486328125, -0.5562591552734375, -0.515533447265625, -0.4748077392578125, -0.43408203125, -0.3933563232421875, -0.352630615234375, -0.3119049072265625, -0.27117919921875, -0.2304534912109375, -0.189727783203125, -0.1490020751953125, -0.1082763671875, -0.0675506591796875, -0.026824951171875, 0.0139007568359375, 0.05462646484375, 0.0953521728515625, 0.136077880859375, 0.1768035888671875, 0.217529296875, 0.2582550048828125, 0.298980712890625, 0.3397064208984375, 0.38043212890625, 0.4211578369140625, 0.461883544921875, 0.5026092529296875, 0.5433349609375, 0.5840606689453125, 0.624786376953125, 0.6655120849609375, 0.70623779296875, 0.7469635009765625, 0.787689208984375, 0.8284149169921875, 0.869140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 13.0, 20.0, 21.0, 30.0, 42.0, 53.0, 85.0, 124.0, 199.0, 270.0, 449.0, 775.0, 1290.0, 2792.0, 8073.0, 41757.0, 310263.0, 591143.0, 71719.0, 11867.0, 3512.0, 1586.0, 879.0, 534.0, 357.0, 224.0, 141.0, 111.0, 60.0, 43.0, 37.0, 24.0, 16.0, 11.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.47265625, -4.355377197265625, -4.23809814453125, -4.120819091796875, -4.0035400390625, -3.886260986328125, -3.76898193359375, -3.651702880859375, -3.534423828125, -3.417144775390625, -3.29986572265625, -3.182586669921875, -3.0653076171875, -2.948028564453125, -2.83074951171875, -2.713470458984375, -2.59619140625, -2.478912353515625, -2.36163330078125, -2.244354248046875, -2.1270751953125, -2.009796142578125, -1.89251708984375, -1.775238037109375, -1.657958984375, -1.540679931640625, -1.42340087890625, -1.306121826171875, -1.1888427734375, -1.071563720703125, -0.95428466796875, -0.837005615234375, -0.7197265625, -0.602447509765625, -0.48516845703125, -0.367889404296875, -0.2506103515625, -0.133331298828125, -0.01605224609375, 0.101226806640625, 0.218505859375, 0.335784912109375, 0.45306396484375, 0.570343017578125, 0.6876220703125, 0.804901123046875, 0.92218017578125, 1.039459228515625, 1.15673828125, 1.274017333984375, 1.39129638671875, 1.508575439453125, 1.6258544921875, 1.743133544921875, 1.86041259765625, 1.977691650390625, 2.094970703125, 2.212249755859375, 2.32952880859375, 2.446807861328125, 2.5640869140625, 2.681365966796875, 2.79864501953125, 2.915924072265625, 3.033203125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 7.0, 4.0, 7.0, 11.0, 13.0, 26.0, 30.0, 35.0, 35.0, 37.0, 43.0, 52.0, 61.0, 67.0, 52.0, 87.0, 65.0, 61.0, 62.0, 45.0, 43.0, 31.0, 29.0, 25.0, 21.0, 24.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.54296875, -7.35833740234375, -7.1737060546875, -6.98907470703125, -6.804443359375, -6.61981201171875, -6.4351806640625, -6.25054931640625, -6.06591796875, -5.88128662109375, -5.6966552734375, -5.51202392578125, -5.327392578125, -5.14276123046875, -4.9581298828125, -4.77349853515625, -4.5888671875, -4.40423583984375, -4.2196044921875, -4.03497314453125, -3.850341796875, -3.66571044921875, -3.4810791015625, -3.29644775390625, -3.11181640625, -2.92718505859375, -2.7425537109375, -2.55792236328125, -2.373291015625, -2.18865966796875, -2.0040283203125, -1.81939697265625, -1.634765625, -1.45013427734375, -1.2655029296875, -1.08087158203125, -0.896240234375, -0.71160888671875, -0.5269775390625, -0.34234619140625, -0.15771484375, 0.02691650390625, 0.2115478515625, 0.39617919921875, 0.580810546875, 0.76544189453125, 0.9500732421875, 1.13470458984375, 1.3193359375, 1.50396728515625, 1.6885986328125, 1.87322998046875, 2.057861328125, 2.24249267578125, 2.4271240234375, 2.61175537109375, 2.79638671875, 2.98101806640625, 3.1656494140625, 3.35028076171875, 3.534912109375, 3.71954345703125, 3.9041748046875, 4.08880615234375, 4.2734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 16.0, 13.0, 31.0, 90.0, 168.0, 557.0, 2035.0, 19816.0, 876368.0, 142508.0, 5368.0, 1024.0, 313.0, 121.0, 52.0, 29.0, 15.0, 8.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.044921875, -2.957305908203125, -2.86968994140625, -2.782073974609375, -2.6944580078125, -2.606842041015625, -2.51922607421875, -2.431610107421875, -2.343994140625, -2.256378173828125, -2.16876220703125, -2.081146240234375, -1.9935302734375, -1.905914306640625, -1.81829833984375, -1.730682373046875, -1.64306640625, -1.555450439453125, -1.46783447265625, -1.380218505859375, -1.2926025390625, -1.204986572265625, -1.11737060546875, -1.029754638671875, -0.942138671875, -0.854522705078125, -0.76690673828125, -0.679290771484375, -0.5916748046875, -0.504058837890625, -0.41644287109375, -0.328826904296875, -0.2412109375, -0.153594970703125, -0.06597900390625, 0.021636962890625, 0.1092529296875, 0.196868896484375, 0.28448486328125, 0.372100830078125, 0.459716796875, 0.547332763671875, 0.63494873046875, 0.722564697265625, 0.8101806640625, 0.897796630859375, 0.98541259765625, 1.073028564453125, 1.16064453125, 1.248260498046875, 1.33587646484375, 1.423492431640625, 1.5111083984375, 1.598724365234375, 1.68634033203125, 1.773956298828125, 1.861572265625, 1.949188232421875, 2.03680419921875, 2.124420166015625, 2.2120361328125, 2.299652099609375, 2.38726806640625, 2.474884033203125, 2.5625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 3.0, 2.0, 3.0, 13.0, 13.0, 10.0, 21.0, 19.0, 22.0, 28.0, 31.0, 47.0, 54.0, 52.0, 85.0, 67.0, 83.0, 90.0, 60.0, 50.0, 43.0, 46.0, 39.0, 30.0, 19.0, 13.0, 15.0, 9.0, 7.0, 9.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021457672119140625, -0.00020572543144226074, -0.00019687414169311523, -0.00018802285194396973, -0.00017917156219482422, -0.0001703202724456787, -0.0001614689826965332, -0.0001526176929473877, -0.0001437664031982422, -0.00013491511344909668, -0.00012606382369995117, -0.00011721253395080566, -0.00010836124420166016, -9.950995445251465e-05, -9.065866470336914e-05, -8.180737495422363e-05, -7.295608520507812e-05, -6.410479545593262e-05, -5.525350570678711e-05, -4.64022159576416e-05, -3.7550926208496094e-05, -2.8699636459350586e-05, -1.9848346710205078e-05, -1.099705696105957e-05, -2.1457672119140625e-06, 6.705522537231445e-06, 1.5556812286376953e-05, 2.440810203552246e-05, 3.325939178466797e-05, 4.2110681533813477e-05, 5.0961971282958984e-05, 5.981326103210449e-05, 6.866455078125e-05, 7.751584053039551e-05, 8.636713027954102e-05, 9.521842002868652e-05, 0.00010406970977783203, 0.00011292099952697754, 0.00012177228927612305, 0.00013062357902526855, 0.00013947486877441406, 0.00014832615852355957, 0.00015717744827270508, 0.00016602873802185059, 0.0001748800277709961, 0.0001837313175201416, 0.0001925826072692871, 0.00020143389701843262, 0.00021028518676757812, 0.00021913647651672363, 0.00022798776626586914, 0.00023683905601501465, 0.00024569034576416016, 0.00025454163551330566, 0.00026339292526245117, 0.0002722442150115967, 0.0002810955047607422, 0.0002899467945098877, 0.0002987980842590332, 0.0003076493740081787, 0.0003165006637573242, 0.0003253519535064697, 0.00033420324325561523, 0.00034305453300476074, 0.00035190582275390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 5.0, 9.0, 9.0, 11.0, 21.0, 24.0, 49.0, 70.0, 85.0, 182.0, 265.0, 424.0, 777.0, 1589.0, 3690.0, 11771.0, 57742.0, 528702.0, 374913.0, 50672.0, 10681.0, 3495.0, 1510.0, 725.0, 404.0, 241.0, 148.0, 93.0, 61.0, 51.0, 30.0, 33.0, 14.0, 16.0, 12.0, 6.0, 5.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9940032958984375, -0.959686279296875, -0.9253692626953125, -0.89105224609375, -0.8567352294921875, -0.822418212890625, -0.7881011962890625, -0.7537841796875, -0.7194671630859375, -0.685150146484375, -0.6508331298828125, -0.61651611328125, -0.5821990966796875, -0.547882080078125, -0.5135650634765625, -0.479248046875, -0.4449310302734375, -0.410614013671875, -0.3762969970703125, -0.34197998046875, -0.3076629638671875, -0.273345947265625, -0.2390289306640625, -0.2047119140625, -0.1703948974609375, -0.136077880859375, -0.1017608642578125, -0.06744384765625, -0.0331268310546875, 0.001190185546875, 0.0355072021484375, 0.06982421875, 0.1041412353515625, 0.138458251953125, 0.1727752685546875, 0.20709228515625, 0.2414093017578125, 0.275726318359375, 0.3100433349609375, 0.3443603515625, 0.3786773681640625, 0.412994384765625, 0.4473114013671875, 0.48162841796875, 0.5159454345703125, 0.550262451171875, 0.5845794677734375, 0.618896484375, 0.6532135009765625, 0.687530517578125, 0.7218475341796875, 0.75616455078125, 0.7904815673828125, 0.824798583984375, 0.8591156005859375, 0.8934326171875, 0.9277496337890625, 0.962066650390625, 0.9963836669921875, 1.03070068359375, 1.0650177001953125, 1.099334716796875, 1.1336517333984375, 1.16796875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 8.0, 6.0, 12.0, 8.0, 12.0, 20.0, 20.0, 26.0, 31.0, 43.0, 37.0, 52.0, 61.0, 58.0, 75.0, 66.0, 56.0, 59.0, 49.0, 49.0, 45.0, 43.0, 39.0, 21.0, 28.0, 15.0, 16.0, 10.0, 2.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91015625, -0.8780517578125, -0.845947265625, -0.8138427734375, -0.78173828125, -0.7496337890625, -0.717529296875, -0.6854248046875, -0.6533203125, -0.6212158203125, -0.589111328125, -0.5570068359375, -0.52490234375, -0.4927978515625, -0.460693359375, -0.4285888671875, -0.396484375, -0.3643798828125, -0.332275390625, -0.3001708984375, -0.26806640625, -0.2359619140625, -0.203857421875, -0.1717529296875, -0.1396484375, -0.1075439453125, -0.075439453125, -0.0433349609375, -0.01123046875, 0.0208740234375, 0.052978515625, 0.0850830078125, 0.1171875, 0.1492919921875, 0.181396484375, 0.2135009765625, 0.24560546875, 0.2777099609375, 0.309814453125, 0.3419189453125, 0.3740234375, 0.4061279296875, 0.438232421875, 0.4703369140625, 0.50244140625, 0.5345458984375, 0.566650390625, 0.5987548828125, 0.630859375, 0.6629638671875, 0.695068359375, 0.7271728515625, 0.75927734375, 0.7913818359375, 0.823486328125, 0.8555908203125, 0.8876953125, 0.9197998046875, 0.951904296875, 0.9840087890625, 1.01611328125, 1.0482177734375, 1.080322265625, 1.1124267578125, 1.14453125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 2.0, 7.0, 16.0, 36.0, 57.0, 87.0, 119.0, 222.0, 169.0, 121.0, 74.0, 40.0, 21.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.81401824951172, -31.917997360229492, -31.021976470947266, -30.12595558166504, -29.229934692382812, -28.333913803100586, -27.43789291381836, -26.541872024536133, -25.645851135253906, -24.74983024597168, -23.853809356689453, -22.957788467407227, -22.061767578125, -21.165746688842773, -20.269725799560547, -19.37370491027832, -18.477684020996094, -17.581663131713867, -16.68564224243164, -15.789621353149414, -14.893600463867188, -13.997579574584961, -13.101558685302734, -12.205537796020508, -11.309516906738281, -10.413496017456055, -9.517475128173828, -8.621454238891602, -7.725433349609375, -6.829412460327148, -5.933391571044922, -5.037370681762695, -4.141349792480469, -3.245328903198242, -2.3493080139160156, -1.453287124633789, -0.5572662353515625, 0.33875465393066406, 1.2347755432128906, 2.130796432495117, 3.0268173217773438, 3.9228382110595703, 4.818859100341797, 5.714879989624023, 6.61090087890625, 7.506921768188477, 8.402942657470703, 9.29896354675293, 10.194984436035156, 11.091005325317383, 11.98702621459961, 12.883047103881836, 13.779067993164062, 14.675088882446289, 15.571109771728516, 16.467130661010742, 17.36315155029297, 18.259172439575195, 19.155193328857422, 20.05121421813965, 20.947235107421875, 21.8432559967041, 22.739276885986328, 23.635297775268555, 24.53131866455078]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 7.0, 5.0, 8.0, 3.0, 12.0, 19.0, 25.0, 28.0, 22.0, 22.0, 28.0, 33.0, 37.0, 37.0, 43.0, 55.0, 63.0, 67.0, 64.0, 64.0, 46.0, 34.0, 36.0, 27.0, 26.0, 35.0, 19.0, 25.0, 14.0, 15.0, 16.0, 8.0, 10.0, 10.0, 6.0, 8.0, 3.0, 2.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.392358779907227, -16.842315673828125, -16.292272567749023, -15.742228507995605, -15.192185401916504, -14.642142295837402, -14.092098236083984, -13.542055130004883, -12.992012023925781, -12.44196891784668, -11.891925811767578, -11.34188175201416, -10.791838645935059, -10.241795539855957, -9.691751480102539, -9.141708374023438, -8.591665267944336, -8.041622161865234, -7.491578578948975, -6.941534996032715, -6.391491889953613, -5.841448783874512, -5.291405200958252, -4.741361618041992, -4.191318511962891, -3.64127516746521, -3.0912318229675293, -2.5411884784698486, -1.991145133972168, -1.4411017894744873, -0.8910584449768066, -0.341015100479126, 0.20902633666992188, 0.7590696811676025, 1.3091130256652832, 1.8591563701629639, 2.4091997146606445, 2.959243059158325, 3.509286403656006, 4.059329986572266, 4.609373092651367, 5.159416198730469, 5.7094597816467285, 6.259503364562988, 6.80954647064209, 7.359589576721191, 7.909633159637451, 8.459676742553711, 9.009719848632812, 9.559762954711914, 10.109806060791016, 10.659850120544434, 11.209893226623535, 11.759936332702637, 12.309980392456055, 12.860023498535156, 13.410066604614258, 13.96010971069336, 14.510152816772461, 15.060196876525879, 15.61023998260498, 16.1602840423584, 16.7103271484375, 17.2603702545166, 17.810413360595703]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 5.0, 14.0, 19.0, 23.0, 24.0, 46.0, 60.0, 96.0, 179.0, 303.0, 519.0, 947.0, 1550.0, 2999.0, 5851.0, 11603.0, 26092.0, 67307.0, 224594.0, 862959.0, 1826528.0, 832502.0, 214093.0, 65896.0, 25592.0, 11738.0, 5784.0, 3055.0, 1640.0, 930.0, 580.0, 280.0, 178.0, 112.0, 67.0, 58.0, 19.0, 18.0, 7.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0693359375, -1.0408096313476562, -1.0122833251953125, -0.9837570190429688, -0.955230712890625, -0.9267044067382812, -0.8981781005859375, -0.8696517944335938, -0.84112548828125, -0.8125991821289062, -0.7840728759765625, -0.7555465698242188, -0.727020263671875, -0.6984939575195312, -0.6699676513671875, -0.6414413452148438, -0.6129150390625, -0.5843887329101562, -0.5558624267578125, -0.5273361206054688, -0.498809814453125, -0.47028350830078125, -0.4417572021484375, -0.41323089599609375, -0.38470458984375, -0.35617828369140625, -0.3276519775390625, -0.29912567138671875, -0.270599365234375, -0.24207305908203125, -0.2135467529296875, -0.18502044677734375, -0.156494140625, -0.12796783447265625, -0.0994415283203125, -0.07091522216796875, -0.042388916015625, -0.01386260986328125, 0.0146636962890625, 0.04319000244140625, 0.07171630859375, 0.10024261474609375, 0.1287689208984375, 0.15729522705078125, 0.185821533203125, 0.21434783935546875, 0.2428741455078125, 0.27140045166015625, 0.2999267578125, 0.32845306396484375, 0.3569793701171875, 0.38550567626953125, 0.414031982421875, 0.44255828857421875, 0.4710845947265625, 0.49961090087890625, 0.52813720703125, 0.5566635131835938, 0.5851898193359375, 0.6137161254882812, 0.642242431640625, 0.6707687377929688, 0.6992950439453125, 0.7278213500976562, 0.75634765625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 10.0, 7.0, 6.0, 8.0, 10.0, 11.0, 12.0, 12.0, 16.0, 15.0, 21.0, 29.0, 34.0, 38.0, 35.0, 38.0, 35.0, 40.0, 33.0, 49.0, 44.0, 41.0, 46.0, 30.0, 33.0, 45.0, 36.0, 38.0, 25.0, 30.0, 24.0, 16.0, 18.0, 9.0, 15.0, 15.0, 16.0, 10.0, 13.0, 10.0, 6.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.8359375, -0.81036376953125, -0.7847900390625, -0.75921630859375, -0.733642578125, -0.70806884765625, -0.6824951171875, -0.65692138671875, -0.63134765625, -0.60577392578125, -0.5802001953125, -0.55462646484375, -0.529052734375, -0.50347900390625, -0.4779052734375, -0.45233154296875, -0.4267578125, -0.40118408203125, -0.3756103515625, -0.35003662109375, -0.324462890625, -0.29888916015625, -0.2733154296875, -0.24774169921875, -0.22216796875, -0.19659423828125, -0.1710205078125, -0.14544677734375, -0.119873046875, -0.09429931640625, -0.0687255859375, -0.04315185546875, -0.017578125, 0.00799560546875, 0.0335693359375, 0.05914306640625, 0.084716796875, 0.11029052734375, 0.1358642578125, 0.16143798828125, 0.18701171875, 0.21258544921875, 0.2381591796875, 0.26373291015625, 0.289306640625, 0.31488037109375, 0.3404541015625, 0.36602783203125, 0.3916015625, 0.41717529296875, 0.4427490234375, 0.46832275390625, 0.493896484375, 0.51947021484375, 0.5450439453125, 0.57061767578125, 0.59619140625, 0.62176513671875, 0.6473388671875, 0.67291259765625, 0.698486328125, 0.72406005859375, 0.7496337890625, 0.77520751953125, 0.80078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 9.0, 6.0, 9.0, 15.0, 26.0, 22.0, 42.0, 38.0, 74.0, 116.0, 164.0, 327.0, 630.0, 1498.0, 4174.0, 13982.0, 58478.0, 435522.0, 3220498.0, 381593.0, 55331.0, 13750.0, 4434.0, 1747.0, 777.0, 414.0, 221.0, 133.0, 71.0, 60.0, 39.0, 26.0, 16.0, 10.0, 5.0, 9.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.39453125, -2.322998046875, -2.25146484375, -2.179931640625, -2.1083984375, -2.036865234375, -1.96533203125, -1.893798828125, -1.822265625, -1.750732421875, -1.67919921875, -1.607666015625, -1.5361328125, -1.464599609375, -1.39306640625, -1.321533203125, -1.25, -1.178466796875, -1.10693359375, -1.035400390625, -0.9638671875, -0.892333984375, -0.82080078125, -0.749267578125, -0.677734375, -0.606201171875, -0.53466796875, -0.463134765625, -0.3916015625, -0.320068359375, -0.24853515625, -0.177001953125, -0.10546875, -0.033935546875, 0.03759765625, 0.109130859375, 0.1806640625, 0.252197265625, 0.32373046875, 0.395263671875, 0.466796875, 0.538330078125, 0.60986328125, 0.681396484375, 0.7529296875, 0.824462890625, 0.89599609375, 0.967529296875, 1.0390625, 1.110595703125, 1.18212890625, 1.253662109375, 1.3251953125, 1.396728515625, 1.46826171875, 1.539794921875, 1.611328125, 1.682861328125, 1.75439453125, 1.825927734375, 1.8974609375, 1.968994140625, 2.04052734375, 2.112060546875, 2.18359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 9.0, 18.0, 15.0, 25.0, 29.0, 36.0, 51.0, 103.0, 138.0, 269.0, 486.0, 668.0, 768.0, 536.0, 357.0, 166.0, 116.0, 80.0, 55.0, 36.0, 23.0, 15.0, 17.0, 14.0, 8.0, 6.0, 3.0, 2.0, 6.0, 1.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.615234375, -2.5286865234375, -2.442138671875, -2.3555908203125, -2.26904296875, -2.1824951171875, -2.095947265625, -2.0093994140625, -1.9228515625, -1.8363037109375, -1.749755859375, -1.6632080078125, -1.57666015625, -1.4901123046875, -1.403564453125, -1.3170166015625, -1.23046875, -1.1439208984375, -1.057373046875, -0.9708251953125, -0.88427734375, -0.7977294921875, -0.711181640625, -0.6246337890625, -0.5380859375, -0.4515380859375, -0.364990234375, -0.2784423828125, -0.19189453125, -0.1053466796875, -0.018798828125, 0.0677490234375, 0.154296875, 0.2408447265625, 0.327392578125, 0.4139404296875, 0.50048828125, 0.5870361328125, 0.673583984375, 0.7601318359375, 0.8466796875, 0.9332275390625, 1.019775390625, 1.1063232421875, 1.19287109375, 1.2794189453125, 1.365966796875, 1.4525146484375, 1.5390625, 1.6256103515625, 1.712158203125, 1.7987060546875, 1.88525390625, 1.9718017578125, 2.058349609375, 2.1448974609375, 2.2314453125, 2.3179931640625, 2.404541015625, 2.4910888671875, 2.57763671875, 2.6641845703125, 2.750732421875, 2.8372802734375, 2.923828125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 11.0, 35.0, 74.0, 259.0, 284.0, 220.0, 57.0, 26.0, 20.0, 2.0, 7.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.636878967285156, -43.29689025878906, -41.9568977355957, -40.616905212402344, -39.27691650390625, -37.936927795410156, -36.5969352722168, -35.25694274902344, -33.916954040527344, -32.57696533203125, -31.23697280883789, -29.896982192993164, -28.556991577148438, -27.21700096130371, -25.877010345458984, -24.537019729614258, -23.19702911376953, -21.857038497924805, -20.517047882080078, -19.17705726623535, -17.837066650390625, -16.4970760345459, -15.157085418701172, -13.817094802856445, -12.477104187011719, -11.137113571166992, -9.797122955322266, -8.457132339477539, -7.1171417236328125, -5.777151107788086, -4.437160491943359, -3.097169876098633, -1.7571754455566406, -0.41718482971191406, 0.9228057861328125, 2.262796401977539, 3.6027870178222656, 4.942777633666992, 6.282768249511719, 7.622758865356445, 8.962749481201172, 10.302740097045898, 11.642730712890625, 12.982721328735352, 14.322711944580078, 15.662702560424805, 17.00269317626953, 18.342683792114258, 19.682674407958984, 21.02266502380371, 22.362655639648438, 23.702646255493164, 25.04263687133789, 26.382627487182617, 27.722618103027344, 29.06260871887207, 30.402599334716797, 31.742589950561523, 33.08258056640625, 34.422569274902344, 35.7625617980957, 37.10255432128906, 38.442543029785156, 39.78253173828125, 41.12252426147461]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 12.0, 10.0, 8.0, 8.0, 10.0, 13.0, 15.0, 18.0, 23.0, 27.0, 33.0, 38.0, 39.0, 55.0, 46.0, 54.0, 54.0, 64.0, 58.0, 58.0, 59.0, 46.0, 45.0, 40.0, 29.0, 29.0, 20.0, 21.0, 13.0, 10.0, 16.0, 7.0, 8.0, 2.0, 8.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.405157089233398, -10.970491409301758, -10.535825729370117, -10.101160049438477, -9.666494369506836, -9.231828689575195, -8.797163009643555, -8.362497329711914, -7.927831649780273, -7.493165969848633, -7.058500289916992, -6.623834609985352, -6.189168930053711, -5.75450325012207, -5.31983757019043, -4.885171890258789, -4.45050573348999, -4.01584005355835, -3.581174373626709, -3.1465086936950684, -2.7118430137634277, -2.277177095413208, -1.8425114154815674, -1.4078457355499268, -0.9731800556182861, -0.5385143756866455, -0.10384863615036011, 0.3308171033859253, 0.7654827833175659, 1.200148582458496, 1.6348142623901367, 2.0694799423217773, 2.504145622253418, 2.9388113021850586, 3.373476982116699, 3.80814266204834, 4.2428083419799805, 4.677474021911621, 5.112139701843262, 5.546805381774902, 5.981471061706543, 6.416136741638184, 6.850802421569824, 7.285468101501465, 7.7201337814331055, 8.154799461364746, 8.589465141296387, 9.024130821228027, 9.458797454833984, 9.893463134765625, 10.328128814697266, 10.762794494628906, 11.197460174560547, 11.632125854492188, 12.066791534423828, 12.501457214355469, 12.93612289428711, 13.37078857421875, 13.80545425415039, 14.240119934082031, 14.674785614013672, 15.109451293945312, 15.544116973876953, 15.978782653808594, 16.413448333740234]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 2.0, 6.0, 11.0, 17.0, 22.0, 41.0, 47.0, 86.0, 120.0, 200.0, 296.0, 450.0, 721.0, 1266.0, 2099.0, 3736.0, 6752.0, 12405.0, 23564.0, 44899.0, 85543.0, 155699.0, 230588.0, 208434.0, 126814.0, 67570.0, 35239.0, 18756.0, 9957.0, 5443.0, 3106.0, 1803.0, 1105.0, 606.0, 402.0, 261.0, 161.0, 105.0, 76.0, 44.0, 36.0, 20.0, 13.0, 8.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.3134765625, -1.2708587646484375, -1.228240966796875, -1.1856231689453125, -1.14300537109375, -1.1003875732421875, -1.057769775390625, -1.0151519775390625, -0.9725341796875, -0.9299163818359375, -0.887298583984375, -0.8446807861328125, -0.80206298828125, -0.7594451904296875, -0.716827392578125, -0.6742095947265625, -0.631591796875, -0.5889739990234375, -0.546356201171875, -0.5037384033203125, -0.46112060546875, -0.4185028076171875, -0.375885009765625, -0.3332672119140625, -0.2906494140625, -0.2480316162109375, -0.205413818359375, -0.1627960205078125, -0.12017822265625, -0.0775604248046875, -0.034942626953125, 0.0076751708984375, 0.05029296875, 0.0929107666015625, 0.135528564453125, 0.1781463623046875, 0.22076416015625, 0.2633819580078125, 0.305999755859375, 0.3486175537109375, 0.3912353515625, 0.4338531494140625, 0.476470947265625, 0.5190887451171875, 0.56170654296875, 0.6043243408203125, 0.646942138671875, 0.6895599365234375, 0.732177734375, 0.7747955322265625, 0.817413330078125, 0.8600311279296875, 0.90264892578125, 0.9452667236328125, 0.987884521484375, 1.0305023193359375, 1.0731201171875, 1.1157379150390625, 1.158355712890625, 1.2009735107421875, 1.24359130859375, 1.2862091064453125, 1.328826904296875, 1.3714447021484375, 1.4140625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 7.0, 8.0, 9.0, 21.0, 19.0, 15.0, 26.0, 42.0, 39.0, 61.0, 69.0, 48.0, 61.0, 70.0, 59.0, 66.0, 54.0, 49.0, 55.0, 47.0, 36.0, 30.0, 31.0, 30.0, 15.0, 17.0, 5.0, 9.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-1.875, -1.8325729370117188, -1.7901458740234375, -1.7477188110351562, -1.705291748046875, -1.6628646850585938, -1.6204376220703125, -1.5780105590820312, -1.53558349609375, -1.4931564331054688, -1.4507293701171875, -1.4083023071289062, -1.365875244140625, -1.3234481811523438, -1.2810211181640625, -1.2385940551757812, -1.1961669921875, -1.1537399291992188, -1.1113128662109375, -1.0688858032226562, -1.026458740234375, -0.9840316772460938, -0.9416046142578125, -0.8991775512695312, -0.85675048828125, -0.8143234252929688, -0.7718963623046875, -0.7294692993164062, -0.687042236328125, -0.6446151733398438, -0.6021881103515625, -0.5597610473632812, -0.517333984375, -0.47490692138671875, -0.4324798583984375, -0.39005279541015625, -0.347625732421875, -0.30519866943359375, -0.2627716064453125, -0.22034454345703125, -0.17791748046875, -0.13549041748046875, -0.0930633544921875, -0.05063629150390625, -0.008209228515625, 0.03421783447265625, 0.0766448974609375, 0.11907196044921875, 0.1614990234375, 0.20392608642578125, 0.2463531494140625, 0.28878021240234375, 0.331207275390625, 0.37363433837890625, 0.4160614013671875, 0.45848846435546875, 0.50091552734375, 0.5433425903320312, 0.5857696533203125, 0.6281967163085938, 0.670623779296875, 0.7130508422851562, 0.7554779052734375, 0.7979049682617188, 0.84033203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 6.0, 6.0, 13.0, 23.0, 38.0, 43.0, 69.0, 100.0, 152.0, 238.0, 347.0, 548.0, 983.0, 2066.0, 5989.0, 26861.0, 182314.0, 683409.0, 117714.0, 18917.0, 4567.0, 1736.0, 864.0, 547.0, 318.0, 202.0, 147.0, 111.0, 67.0, 37.0, 41.0, 27.0, 24.0, 14.0, 6.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.527923583984375, -4.40350341796875, -4.279083251953125, -4.1546630859375, -4.030242919921875, -3.90582275390625, -3.781402587890625, -3.656982421875, -3.532562255859375, -3.40814208984375, -3.283721923828125, -3.1593017578125, -3.034881591796875, -2.91046142578125, -2.786041259765625, -2.66162109375, -2.537200927734375, -2.41278076171875, -2.288360595703125, -2.1639404296875, -2.039520263671875, -1.91510009765625, -1.790679931640625, -1.666259765625, -1.541839599609375, -1.41741943359375, -1.292999267578125, -1.1685791015625, -1.044158935546875, -0.91973876953125, -0.795318603515625, -0.6708984375, -0.546478271484375, -0.42205810546875, -0.297637939453125, -0.1732177734375, -0.048797607421875, 0.07562255859375, 0.200042724609375, 0.324462890625, 0.448883056640625, 0.57330322265625, 0.697723388671875, 0.8221435546875, 0.946563720703125, 1.07098388671875, 1.195404052734375, 1.31982421875, 1.444244384765625, 1.56866455078125, 1.693084716796875, 1.8175048828125, 1.941925048828125, 2.06634521484375, 2.190765380859375, 2.315185546875, 2.439605712890625, 2.56402587890625, 2.688446044921875, 2.8128662109375, 2.937286376953125, 3.06170654296875, 3.186126708984375, 3.310546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 8.0, 9.0, 11.0, 8.0, 16.0, 24.0, 16.0, 31.0, 33.0, 35.0, 41.0, 37.0, 42.0, 43.0, 43.0, 62.0, 51.0, 58.0, 46.0, 43.0, 39.0, 34.0, 36.0, 36.0, 32.0, 23.0, 15.0, 22.0, 21.0, 11.0, 16.0, 15.0, 10.0, 7.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.75, -4.618988037109375, -4.48797607421875, -4.356964111328125, -4.2259521484375, -4.094940185546875, -3.96392822265625, -3.832916259765625, -3.701904296875, -3.570892333984375, -3.43988037109375, -3.308868408203125, -3.1778564453125, -3.046844482421875, -2.91583251953125, -2.784820556640625, -2.65380859375, -2.522796630859375, -2.39178466796875, -2.260772705078125, -2.1297607421875, -1.998748779296875, -1.86773681640625, -1.736724853515625, -1.605712890625, -1.474700927734375, -1.34368896484375, -1.212677001953125, -1.0816650390625, -0.950653076171875, -0.81964111328125, -0.688629150390625, -0.5576171875, -0.426605224609375, -0.29559326171875, -0.164581298828125, -0.0335693359375, 0.097442626953125, 0.22845458984375, 0.359466552734375, 0.490478515625, 0.621490478515625, 0.75250244140625, 0.883514404296875, 1.0145263671875, 1.145538330078125, 1.27655029296875, 1.407562255859375, 1.53857421875, 1.669586181640625, 1.80059814453125, 1.931610107421875, 2.0626220703125, 2.193634033203125, 2.32464599609375, 2.455657958984375, 2.586669921875, 2.717681884765625, 2.84869384765625, 2.979705810546875, 3.1107177734375, 3.241729736328125, 3.37274169921875, 3.503753662109375, 3.634765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 7.0, 12.0, 13.0, 14.0, 14.0, 36.0, 50.0, 91.0, 140.0, 234.0, 458.0, 993.0, 2229.0, 6090.0, 19832.0, 88664.0, 562350.0, 288725.0, 56948.0, 13766.0, 4508.0, 1714.0, 754.0, 366.0, 198.0, 125.0, 75.0, 38.0, 25.0, 24.0, 15.0, 17.0, 10.0, 10.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86962890625, -0.8346481323242188, -0.7996673583984375, -0.7646865844726562, -0.729705810546875, -0.6947250366210938, -0.6597442626953125, -0.6247634887695312, -0.58978271484375, -0.5548019409179688, -0.5198211669921875, -0.48484039306640625, -0.449859619140625, -0.41487884521484375, -0.3798980712890625, -0.34491729736328125, -0.3099365234375, -0.27495574951171875, -0.2399749755859375, -0.20499420166015625, -0.170013427734375, -0.13503265380859375, -0.1000518798828125, -0.06507110595703125, -0.03009033203125, 0.00489044189453125, 0.0398712158203125, 0.07485198974609375, 0.109832763671875, 0.14481353759765625, 0.1797943115234375, 0.21477508544921875, 0.249755859375, 0.28473663330078125, 0.3197174072265625, 0.35469818115234375, 0.389678955078125, 0.42465972900390625, 0.4596405029296875, 0.49462127685546875, 0.52960205078125, 0.5645828247070312, 0.5995635986328125, 0.6345443725585938, 0.669525146484375, 0.7045059204101562, 0.7394866943359375, 0.7744674682617188, 0.8094482421875, 0.8444290161132812, 0.8794097900390625, 0.9143905639648438, 0.949371337890625, 0.9843521118164062, 1.0193328857421875, 1.0543136596679688, 1.08929443359375, 1.1242752075195312, 1.1592559814453125, 1.1942367553710938, 1.229217529296875, 1.2641983032226562, 1.2991790771484375, 1.3341598510742188, 1.369140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 13.0, 9.0, 14.0, 12.0, 23.0, 23.0, 28.0, 47.0, 53.0, 77.0, 82.0, 89.0, 95.0, 77.0, 67.0, 44.0, 51.0, 46.0, 26.0, 29.0, 16.0, 23.0, 8.0, 7.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031495094299316406, -0.00030369311571121216, -0.00029243528842926025, -0.00028117746114730835, -0.00026991963386535645, -0.00025866180658340454, -0.00024740397930145264, -0.00023614615201950073, -0.00022488832473754883, -0.00021363049745559692, -0.00020237267017364502, -0.00019111484289169312, -0.0001798570156097412, -0.0001685991883277893, -0.0001573413610458374, -0.0001460835337638855, -0.0001348257064819336, -0.0001235678791999817, -0.00011231005191802979, -0.00010105222463607788, -8.979439735412598e-05, -7.853657007217407e-05, -6.727874279022217e-05, -5.6020915508270264e-05, -4.476308822631836e-05, -3.3505260944366455e-05, -2.224743366241455e-05, -1.0989606380462646e-05, 2.682209014892578e-07, 1.1526048183441162e-05, 2.2783875465393066e-05, 3.404170274734497e-05, 4.5299530029296875e-05, 5.655735731124878e-05, 6.781518459320068e-05, 7.907301187515259e-05, 9.033083915710449e-05, 0.0001015886664390564, 0.0001128464937210083, 0.0001241043210029602, 0.0001353621482849121, 0.00014661997556686401, 0.00015787780284881592, 0.00016913563013076782, 0.00018039345741271973, 0.00019165128469467163, 0.00020290911197662354, 0.00021416693925857544, 0.00022542476654052734, 0.00023668259382247925, 0.00024794042110443115, 0.00025919824838638306, 0.00027045607566833496, 0.00028171390295028687, 0.00029297173023223877, 0.0003042295575141907, 0.0003154873847961426, 0.0003267452120780945, 0.0003380030393600464, 0.0003492608666419983, 0.0003605186939239502, 0.0003717765212059021, 0.000383034348487854, 0.0003942921757698059, 0.0004055500030517578]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 6.0, 7.0, 17.0, 21.0, 26.0, 34.0, 45.0, 73.0, 146.0, 217.0, 444.0, 725.0, 1355.0, 3186.0, 8419.0, 30212.0, 150035.0, 621420.0, 180160.0, 35455.0, 9616.0, 3558.0, 1555.0, 745.0, 416.0, 249.0, 135.0, 88.0, 63.0, 31.0, 19.0, 18.0, 10.0, 16.0, 10.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.0302734375, -0.998626708984375, -0.96697998046875, -0.935333251953125, -0.9036865234375, -0.872039794921875, -0.84039306640625, -0.808746337890625, -0.777099609375, -0.745452880859375, -0.71380615234375, -0.682159423828125, -0.6505126953125, -0.618865966796875, -0.58721923828125, -0.555572509765625, -0.52392578125, -0.492279052734375, -0.46063232421875, -0.428985595703125, -0.3973388671875, -0.365692138671875, -0.33404541015625, -0.302398681640625, -0.270751953125, -0.239105224609375, -0.20745849609375, -0.175811767578125, -0.1441650390625, -0.112518310546875, -0.08087158203125, -0.049224853515625, -0.017578125, 0.014068603515625, 0.04571533203125, 0.077362060546875, 0.1090087890625, 0.140655517578125, 0.17230224609375, 0.203948974609375, 0.235595703125, 0.267242431640625, 0.29888916015625, 0.330535888671875, 0.3621826171875, 0.393829345703125, 0.42547607421875, 0.457122802734375, 0.48876953125, 0.520416259765625, 0.55206298828125, 0.583709716796875, 0.6153564453125, 0.647003173828125, 0.67864990234375, 0.710296630859375, 0.741943359375, 0.773590087890625, 0.80523681640625, 0.836883544921875, 0.8685302734375, 0.900177001953125, 0.93182373046875, 0.963470458984375, 0.9951171875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 10.0, 12.0, 15.0, 34.0, 46.0, 64.0, 63.0, 92.0, 108.0, 109.0, 101.0, 78.0, 79.0, 57.0, 39.0, 31.0, 21.0, 16.0, 12.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.58203125, -1.533416748046875, -1.48480224609375, -1.436187744140625, -1.3875732421875, -1.338958740234375, -1.29034423828125, -1.241729736328125, -1.193115234375, -1.144500732421875, -1.09588623046875, -1.047271728515625, -0.9986572265625, -0.950042724609375, -0.90142822265625, -0.852813720703125, -0.80419921875, -0.755584716796875, -0.70697021484375, -0.658355712890625, -0.6097412109375, -0.561126708984375, -0.51251220703125, -0.463897705078125, -0.415283203125, -0.366668701171875, -0.31805419921875, -0.269439697265625, -0.2208251953125, -0.172210693359375, -0.12359619140625, -0.074981689453125, -0.0263671875, 0.022247314453125, 0.07086181640625, 0.119476318359375, 0.1680908203125, 0.216705322265625, 0.26531982421875, 0.313934326171875, 0.362548828125, 0.411163330078125, 0.45977783203125, 0.508392333984375, 0.5570068359375, 0.605621337890625, 0.65423583984375, 0.702850341796875, 0.75146484375, 0.800079345703125, 0.84869384765625, 0.897308349609375, 0.9459228515625, 0.994537353515625, 1.04315185546875, 1.091766357421875, 1.140380859375, 1.188995361328125, 1.23760986328125, 1.286224365234375, 1.3348388671875, 1.383453369140625, 1.43206787109375, 1.480682373046875, 1.529296875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 10.0, 42.0, 178.0, 431.0, 220.0, 77.0, 23.0, 10.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.16886138916016, -67.41625213623047, -65.66364288330078, -63.91102981567383, -62.15842056274414, -60.40580749511719, -58.6531982421875, -56.90058898925781, -55.147979736328125, -53.39537048339844, -51.642757415771484, -49.8901481628418, -48.13753890991211, -46.384925842285156, -44.63231658935547, -42.87970733642578, -41.12709426879883, -39.37448501586914, -37.62187194824219, -35.8692626953125, -34.11665344238281, -32.364044189453125, -30.611431121826172, -28.858821868896484, -27.106210708618164, -25.353599548339844, -23.600990295410156, -21.848379135131836, -20.095767974853516, -18.343158721923828, -16.590547561645508, -14.837937355041504, -13.0853271484375, -11.332716941833496, -9.580106735229492, -7.827495574951172, -6.074885368347168, -4.322275161743164, -2.5696640014648438, -0.8170537948608398, 0.9355564117431641, 2.688166856765747, 4.44077730178833, 6.193387985229492, 7.945998191833496, 9.6986083984375, 11.45121955871582, 13.203829765319824, 14.956439971923828, 16.70905113220215, 18.461660385131836, 20.214271545410156, 21.966880798339844, 23.719491958618164, 25.472103118896484, 27.224712371826172, 28.977323532104492, 30.729934692382812, 32.4825439453125, 34.23515319824219, 35.98776626586914, 37.74037551879883, 39.49298858642578, 41.24559783935547, 42.998207092285156]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 2.0, 3.0, 5.0, 10.0, 8.0, 8.0, 10.0, 10.0, 7.0, 17.0, 19.0, 18.0, 33.0, 28.0, 25.0, 27.0, 35.0, 37.0, 38.0, 58.0, 66.0, 75.0, 67.0, 52.0, 41.0, 38.0, 37.0, 31.0, 35.0, 24.0, 22.0, 16.0, 17.0, 13.0, 9.0, 9.0, 8.0, 7.0, 7.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-16.460195541381836, -15.962446212768555, -15.46469783782959, -14.966948509216309, -14.469200134277344, -13.971450805664062, -13.473701477050781, -12.975953102111816, -12.478204727172852, -11.98045539855957, -11.482707023620605, -10.984957695007324, -10.48720932006836, -9.989459991455078, -9.491710662841797, -8.993962287902832, -8.49621295928955, -7.998464107513428, -7.500715255737305, -7.002965927124023, -6.505217552185059, -6.007468223571777, -5.509719371795654, -5.011970520019531, -4.514221668243408, -4.016472816467285, -3.518723964691162, -3.02097487449646, -2.523226022720337, -2.025477170944214, -1.5277280807495117, -1.0299792289733887, -0.5322303771972656, -0.0344814658164978, 0.46326744556427, 0.9610164165496826, 1.4587652683258057, 1.9565141201019287, 2.454263210296631, 2.952012062072754, 3.449760913848877, 3.947509765625, 4.445258617401123, 4.943007469177246, 5.440756797790527, 5.938505172729492, 6.436254501342773, 6.9340033531188965, 7.4317522048950195, 7.929501056671143, 8.427249908447266, 8.924999237060547, 9.422747611999512, 9.920496940612793, 10.418245315551758, 10.915994644165039, 11.41374397277832, 11.911493301391602, 12.409241676330566, 12.906991004943848, 13.404739379882812, 13.902488708496094, 14.400238037109375, 14.89798641204834, 15.395734786987305]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 8.0, 6.0, 10.0, 17.0, 22.0, 27.0, 39.0, 64.0, 67.0, 119.0, 181.0, 291.0, 538.0, 1126.0, 2732.0, 7454.0, 27860.0, 167471.0, 1375864.0, 2209801.0, 334879.0, 47436.0, 11390.0, 3616.0, 1487.0, 721.0, 386.0, 210.0, 112.0, 103.0, 53.0, 37.0, 37.0, 26.0, 25.0, 21.0, 12.0, 11.0, 3.0, 8.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.396484375, -1.350189208984375, -1.30389404296875, -1.257598876953125, -1.2113037109375, -1.165008544921875, -1.11871337890625, -1.072418212890625, -1.026123046875, -0.979827880859375, -0.93353271484375, -0.887237548828125, -0.8409423828125, -0.794647216796875, -0.74835205078125, -0.702056884765625, -0.65576171875, -0.609466552734375, -0.56317138671875, -0.516876220703125, -0.4705810546875, -0.424285888671875, -0.37799072265625, -0.331695556640625, -0.285400390625, -0.239105224609375, -0.19281005859375, -0.146514892578125, -0.1002197265625, -0.053924560546875, -0.00762939453125, 0.038665771484375, 0.0849609375, 0.131256103515625, 0.17755126953125, 0.223846435546875, 0.2701416015625, 0.316436767578125, 0.36273193359375, 0.409027099609375, 0.455322265625, 0.501617431640625, 0.54791259765625, 0.594207763671875, 0.6405029296875, 0.686798095703125, 0.73309326171875, 0.779388427734375, 0.82568359375, 0.871978759765625, 0.91827392578125, 0.964569091796875, 1.0108642578125, 1.057159423828125, 1.10345458984375, 1.149749755859375, 1.196044921875, 1.242340087890625, 1.28863525390625, 1.334930419921875, 1.3812255859375, 1.427520751953125, 1.47381591796875, 1.520111083984375, 1.56640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 6.0, 5.0, 8.0, 9.0, 10.0, 11.0, 11.0, 19.0, 26.0, 31.0, 26.0, 35.0, 33.0, 39.0, 40.0, 40.0, 37.0, 45.0, 52.0, 43.0, 46.0, 42.0, 39.0, 33.0, 43.0, 44.0, 39.0, 28.0, 24.0, 19.0, 16.0, 22.0, 19.0, 12.0, 11.0, 9.0, 5.0, 7.0, 2.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.978515625, -0.95013427734375, -0.9217529296875, -0.89337158203125, -0.864990234375, -0.83660888671875, -0.8082275390625, -0.77984619140625, -0.75146484375, -0.72308349609375, -0.6947021484375, -0.66632080078125, -0.637939453125, -0.60955810546875, -0.5811767578125, -0.55279541015625, -0.5244140625, -0.49603271484375, -0.4676513671875, -0.43927001953125, -0.410888671875, -0.38250732421875, -0.3541259765625, -0.32574462890625, -0.29736328125, -0.26898193359375, -0.2406005859375, -0.21221923828125, -0.183837890625, -0.15545654296875, -0.1270751953125, -0.09869384765625, -0.0703125, -0.04193115234375, -0.0135498046875, 0.01483154296875, 0.043212890625, 0.07159423828125, 0.0999755859375, 0.12835693359375, 0.15673828125, 0.18511962890625, 0.2135009765625, 0.24188232421875, 0.270263671875, 0.29864501953125, 0.3270263671875, 0.35540771484375, 0.3837890625, 0.41217041015625, 0.4405517578125, 0.46893310546875, 0.497314453125, 0.52569580078125, 0.5540771484375, 0.58245849609375, 0.61083984375, 0.63922119140625, 0.6676025390625, 0.69598388671875, 0.724365234375, 0.75274658203125, 0.7811279296875, 0.80950927734375, 0.837890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 17.0, 34.0, 81.0, 115.0, 283.0, 670.0, 2470.0, 22823.0, 3594306.0, 561182.0, 9383.0, 1703.0, 633.0, 279.0, 126.0, 77.0, 44.0, 18.0, 11.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4609375, -6.27001953125, -6.0791015625, -5.88818359375, -5.697265625, -5.50634765625, -5.3154296875, -5.12451171875, -4.93359375, -4.74267578125, -4.5517578125, -4.36083984375, -4.169921875, -3.97900390625, -3.7880859375, -3.59716796875, -3.40625, -3.21533203125, -3.0244140625, -2.83349609375, -2.642578125, -2.45166015625, -2.2607421875, -2.06982421875, -1.87890625, -1.68798828125, -1.4970703125, -1.30615234375, -1.115234375, -0.92431640625, -0.7333984375, -0.54248046875, -0.3515625, -0.16064453125, 0.0302734375, 0.22119140625, 0.412109375, 0.60302734375, 0.7939453125, 0.98486328125, 1.17578125, 1.36669921875, 1.5576171875, 1.74853515625, 1.939453125, 2.13037109375, 2.3212890625, 2.51220703125, 2.703125, 2.89404296875, 3.0849609375, 3.27587890625, 3.466796875, 3.65771484375, 3.8486328125, 4.03955078125, 4.23046875, 4.42138671875, 4.6123046875, 4.80322265625, 4.994140625, 5.18505859375, 5.3759765625, 5.56689453125, 5.7578125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 9.0, 10.0, 16.0, 34.0, 50.0, 98.0, 218.0, 524.0, 1061.0, 1029.0, 544.0, 225.0, 111.0, 59.0, 31.0, 13.0, 11.0, 9.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.06640625, -2.93280029296875, -2.7991943359375, -2.66558837890625, -2.531982421875, -2.39837646484375, -2.2647705078125, -2.13116455078125, -1.99755859375, -1.86395263671875, -1.7303466796875, -1.59674072265625, -1.463134765625, -1.32952880859375, -1.1959228515625, -1.06231689453125, -0.9287109375, -0.79510498046875, -0.6614990234375, -0.52789306640625, -0.394287109375, -0.26068115234375, -0.1270751953125, 0.00653076171875, 0.14013671875, 0.27374267578125, 0.4073486328125, 0.54095458984375, 0.674560546875, 0.80816650390625, 0.9417724609375, 1.07537841796875, 1.208984375, 1.34259033203125, 1.4761962890625, 1.60980224609375, 1.743408203125, 1.87701416015625, 2.0106201171875, 2.14422607421875, 2.27783203125, 2.41143798828125, 2.5450439453125, 2.67864990234375, 2.812255859375, 2.94586181640625, 3.0794677734375, 3.21307373046875, 3.3466796875, 3.48028564453125, 3.6138916015625, 3.74749755859375, 3.881103515625, 4.01470947265625, 4.1483154296875, 4.28192138671875, 4.41552734375, 4.54913330078125, 4.6827392578125, 4.81634521484375, 4.949951171875, 5.08355712890625, 5.2171630859375, 5.35076904296875, 5.484375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 12.0, 45.0, 103.0, 221.0, 259.0, 200.0, 87.0, 34.0, 13.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.412261962890625, -32.137489318847656, -30.862712860107422, -29.58793830871582, -28.31316375732422, -27.03839111328125, -25.76361656188965, -24.488842010498047, -23.214067459106445, -21.939292907714844, -20.664518356323242, -19.38974380493164, -18.114971160888672, -16.840194702148438, -15.565422058105469, -14.290647506713867, -13.015872955322266, -11.741098403930664, -10.466323852539062, -9.191550254821777, -7.916775703430176, -6.642001152038574, -5.367227077484131, -4.0924530029296875, -2.817678451538086, -1.5429041385650635, -0.268129825592041, 1.0066444873809814, 2.281418800354004, 3.5561933517456055, 4.830967426300049, 6.105741500854492, 7.380516052246094, 8.655290603637695, 9.930065155029297, 11.204838752746582, 12.479613304138184, 13.754387855529785, 15.02916145324707, 16.303936004638672, 17.578710556030273, 18.853485107421875, 20.128259658813477, 21.403034210205078, 22.677806854248047, 23.95258331298828, 25.22735595703125, 26.50213050842285, 27.776905059814453, 29.051679611206055, 30.326454162597656, 31.601228713989258, 32.87600326538086, 34.15077590942383, 35.42555236816406, 36.70032501220703, 37.97509765625, 39.24987030029297, 40.5246467590332, 41.79941940307617, 43.074195861816406, 44.348968505859375, 45.62374496459961, 46.89851760864258, 48.17329406738281]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 4.0, 10.0, 6.0, 8.0, 17.0, 16.0, 15.0, 28.0, 44.0, 38.0, 39.0, 34.0, 49.0, 44.0, 59.0, 49.0, 51.0, 62.0, 53.0, 36.0, 37.0, 38.0, 37.0, 28.0, 31.0, 33.0, 30.0, 28.0, 12.0, 14.0, 8.0, 7.0, 11.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0], "bins": [-19.158945083618164, -18.691299438476562, -18.223655700683594, -17.756010055541992, -17.28836441040039, -16.820720672607422, -16.35307502746582, -15.885429382324219, -15.417784690856934, -14.950139999389648, -14.482494354248047, -14.014849662780762, -13.54720401763916, -13.079559326171875, -12.611913681030273, -12.144268989562988, -11.676624298095703, -11.208979606628418, -10.741333961486816, -10.273689270019531, -9.80604362487793, -9.338398933410645, -8.87075424194336, -8.403108596801758, -7.935462951660156, -7.467817783355713, -7.0001726150512695, -6.532527923583984, -6.064882755279541, -5.597237586975098, -5.129592418670654, -4.661947250366211, -4.194302558898926, -3.7266573905944824, -3.259012460708618, -2.791367292404175, -2.3237223625183105, -1.8560771942138672, -1.3884320259094238, -0.9207870960235596, -0.4531419277191162, 0.014503151178359985, 0.4821482300758362, 0.9497933387756348, 1.4174383878707886, 1.8850834369659424, 2.3527286052703857, 2.82037353515625, 3.2880187034606934, 3.7556638717651367, 4.22330904006958, 4.690954208374023, 5.158598899841309, 5.626244068145752, 6.093889236450195, 6.5615339279174805, 7.029179573059082, 7.496824741363525, 7.964469909667969, 8.432114601135254, 8.899760246276855, 9.36740493774414, 9.835050582885742, 10.302695274353027, 10.770339965820312]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 4.0, 11.0, 17.0, 30.0, 49.0, 66.0, 106.0, 178.0, 272.0, 429.0, 700.0, 1180.0, 2054.0, 3451.0, 6181.0, 11094.0, 20851.0, 40623.0, 77849.0, 139837.0, 209286.0, 212577.0, 146584.0, 82073.0, 43111.0, 22495.0, 12027.0, 6441.0, 3629.0, 2088.0, 1279.0, 765.0, 440.0, 289.0, 190.0, 104.0, 69.0, 44.0, 34.0, 15.0, 9.0, 12.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.3310546875, -1.2930755615234375, -1.255096435546875, -1.2171173095703125, -1.17913818359375, -1.1411590576171875, -1.103179931640625, -1.0652008056640625, -1.0272216796875, -0.9892425537109375, -0.951263427734375, -0.9132843017578125, -0.87530517578125, -0.8373260498046875, -0.799346923828125, -0.7613677978515625, -0.723388671875, -0.6854095458984375, -0.647430419921875, -0.6094512939453125, -0.57147216796875, -0.5334930419921875, -0.495513916015625, -0.4575347900390625, -0.4195556640625, -0.3815765380859375, -0.343597412109375, -0.3056182861328125, -0.26763916015625, -0.2296600341796875, -0.191680908203125, -0.1537017822265625, -0.11572265625, -0.0777435302734375, -0.039764404296875, -0.0017852783203125, 0.03619384765625, 0.0741729736328125, 0.112152099609375, 0.1501312255859375, 0.1881103515625, 0.2260894775390625, 0.264068603515625, 0.3020477294921875, 0.34002685546875, 0.3780059814453125, 0.415985107421875, 0.4539642333984375, 0.491943359375, 0.5299224853515625, 0.567901611328125, 0.6058807373046875, 0.64385986328125, 0.6818389892578125, 0.719818115234375, 0.7577972412109375, 0.7957763671875, 0.8337554931640625, 0.871734619140625, 0.9097137451171875, 0.94769287109375, 0.9856719970703125, 1.023651123046875, 1.0616302490234375, 1.099609375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 9.0, 9.0, 12.0, 18.0, 13.0, 18.0, 21.0, 20.0, 32.0, 20.0, 23.0, 39.0, 25.0, 39.0, 33.0, 39.0, 37.0, 46.0, 42.0, 51.0, 44.0, 41.0, 42.0, 34.0, 36.0, 32.0, 25.0, 30.0, 21.0, 23.0, 15.0, 18.0, 12.0, 7.0, 15.0, 11.0, 9.0, 5.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.875, -0.8453826904296875, -0.815765380859375, -0.7861480712890625, -0.75653076171875, -0.7269134521484375, -0.697296142578125, -0.6676788330078125, -0.6380615234375, -0.6084442138671875, -0.578826904296875, -0.5492095947265625, -0.51959228515625, -0.4899749755859375, -0.460357666015625, -0.4307403564453125, -0.401123046875, -0.3715057373046875, -0.341888427734375, -0.3122711181640625, -0.28265380859375, -0.2530364990234375, -0.223419189453125, -0.1938018798828125, -0.1641845703125, -0.1345672607421875, -0.104949951171875, -0.0753326416015625, -0.04571533203125, -0.0160980224609375, 0.013519287109375, 0.0431365966796875, 0.07275390625, 0.1023712158203125, 0.131988525390625, 0.1616058349609375, 0.19122314453125, 0.2208404541015625, 0.250457763671875, 0.2800750732421875, 0.3096923828125, 0.3393096923828125, 0.368927001953125, 0.3985443115234375, 0.42816162109375, 0.4577789306640625, 0.487396240234375, 0.5170135498046875, 0.546630859375, 0.5762481689453125, 0.605865478515625, 0.6354827880859375, 0.66510009765625, 0.6947174072265625, 0.724334716796875, 0.7539520263671875, 0.7835693359375, 0.8131866455078125, 0.842803955078125, 0.8724212646484375, 0.90203857421875, 0.9316558837890625, 0.961273193359375, 0.9908905029296875, 1.0205078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 8.0, 6.0, 13.0, 17.0, 20.0, 26.0, 50.0, 66.0, 98.0, 162.0, 250.0, 542.0, 1159.0, 2776.0, 8227.0, 30427.0, 142338.0, 600271.0, 201791.0, 43146.0, 10742.0, 3499.0, 1400.0, 653.0, 359.0, 157.0, 103.0, 68.0, 47.0, 27.0, 28.0, 20.0, 16.0, 10.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.31640625, -3.225830078125, -3.13525390625, -3.044677734375, -2.9541015625, -2.863525390625, -2.77294921875, -2.682373046875, -2.591796875, -2.501220703125, -2.41064453125, -2.320068359375, -2.2294921875, -2.138916015625, -2.04833984375, -1.957763671875, -1.8671875, -1.776611328125, -1.68603515625, -1.595458984375, -1.5048828125, -1.414306640625, -1.32373046875, -1.233154296875, -1.142578125, -1.052001953125, -0.96142578125, -0.870849609375, -0.7802734375, -0.689697265625, -0.59912109375, -0.508544921875, -0.41796875, -0.327392578125, -0.23681640625, -0.146240234375, -0.0556640625, 0.034912109375, 0.12548828125, 0.216064453125, 0.306640625, 0.397216796875, 0.48779296875, 0.578369140625, 0.6689453125, 0.759521484375, 0.85009765625, 0.940673828125, 1.03125, 1.121826171875, 1.21240234375, 1.302978515625, 1.3935546875, 1.484130859375, 1.57470703125, 1.665283203125, 1.755859375, 1.846435546875, 1.93701171875, 2.027587890625, 2.1181640625, 2.208740234375, 2.29931640625, 2.389892578125, 2.48046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 13.0, 6.0, 7.0, 14.0, 12.0, 18.0, 21.0, 23.0, 29.0, 25.0, 34.0, 37.0, 38.0, 44.0, 49.0, 45.0, 54.0, 59.0, 59.0, 54.0, 51.0, 43.0, 38.0, 40.0, 36.0, 22.0, 18.0, 15.0, 18.0, 10.0, 12.0, 10.0, 8.0, 8.0, 8.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.01953125, -3.89141845703125, -3.7633056640625, -3.63519287109375, -3.507080078125, -3.37896728515625, -3.2508544921875, -3.12274169921875, -2.99462890625, -2.86651611328125, -2.7384033203125, -2.61029052734375, -2.482177734375, -2.35406494140625, -2.2259521484375, -2.09783935546875, -1.9697265625, -1.84161376953125, -1.7135009765625, -1.58538818359375, -1.457275390625, -1.32916259765625, -1.2010498046875, -1.07293701171875, -0.94482421875, -0.81671142578125, -0.6885986328125, -0.56048583984375, -0.432373046875, -0.30426025390625, -0.1761474609375, -0.04803466796875, 0.080078125, 0.20819091796875, 0.3363037109375, 0.46441650390625, 0.592529296875, 0.72064208984375, 0.8487548828125, 0.97686767578125, 1.10498046875, 1.23309326171875, 1.3612060546875, 1.48931884765625, 1.617431640625, 1.74554443359375, 1.8736572265625, 2.00177001953125, 2.1298828125, 2.25799560546875, 2.3861083984375, 2.51422119140625, 2.642333984375, 2.77044677734375, 2.8985595703125, 3.02667236328125, 3.15478515625, 3.28289794921875, 3.4110107421875, 3.53912353515625, 3.667236328125, 3.79534912109375, 3.9234619140625, 4.05157470703125, 4.1796875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 10.0, 13.0, 19.0, 22.0, 22.0, 36.0, 44.0, 75.0, 111.0, 174.0, 306.0, 434.0, 778.0, 1471.0, 3102.0, 7457.0, 23093.0, 100536.0, 620508.0, 223931.0, 44608.0, 12501.0, 4582.0, 2033.0, 1070.0, 616.0, 320.0, 218.0, 141.0, 85.0, 70.0, 40.0, 37.0, 17.0, 20.0, 15.0, 12.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0], "bins": [-1.2744140625, -1.2387542724609375, -1.203094482421875, -1.1674346923828125, -1.13177490234375, -1.0961151123046875, -1.060455322265625, -1.0247955322265625, -0.9891357421875, -0.9534759521484375, -0.917816162109375, -0.8821563720703125, -0.84649658203125, -0.8108367919921875, -0.775177001953125, -0.7395172119140625, -0.703857421875, -0.6681976318359375, -0.632537841796875, -0.5968780517578125, -0.56121826171875, -0.5255584716796875, -0.489898681640625, -0.4542388916015625, -0.4185791015625, -0.3829193115234375, -0.347259521484375, -0.3115997314453125, -0.27593994140625, -0.2402801513671875, -0.204620361328125, -0.1689605712890625, -0.13330078125, -0.0976409912109375, -0.061981201171875, -0.0263214111328125, 0.00933837890625, 0.0449981689453125, 0.080657958984375, 0.1163177490234375, 0.1519775390625, 0.1876373291015625, 0.223297119140625, 0.2589569091796875, 0.29461669921875, 0.3302764892578125, 0.365936279296875, 0.4015960693359375, 0.437255859375, 0.4729156494140625, 0.508575439453125, 0.5442352294921875, 0.57989501953125, 0.6155548095703125, 0.651214599609375, 0.6868743896484375, 0.7225341796875, 0.7581939697265625, 0.793853759765625, 0.8295135498046875, 0.86517333984375, 0.9008331298828125, 0.936492919921875, 0.9721527099609375, 1.0078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 16.0, 35.0, 99.0, 186.0, 288.0, 174.0, 101.0, 39.0, 23.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009074211120605469, -0.0008755847811698914, -0.0008437484502792358, -0.0008119121193885803, -0.0007800757884979248, -0.0007482394576072693, -0.0007164031267166138, -0.0006845667958259583, -0.0006527304649353027, -0.0006208941340446472, -0.0005890578031539917, -0.0005572214722633362, -0.0005253851413726807, -0.0004935488104820251, -0.00046171247959136963, -0.0004298761487007141, -0.0003980398178100586, -0.0003662034869194031, -0.00033436715602874756, -0.00030253082513809204, -0.0002706944942474365, -0.000238858163356781, -0.0002070218324661255, -0.00017518550157546997, -0.00014334917068481445, -0.00011151283979415894, -7.967650890350342e-05, -4.78401780128479e-05, -1.6003847122192383e-05, 1.5832483768463135e-05, 4.766881465911865e-05, 7.950514554977417e-05, 0.00011134147644042969, 0.0001431778073310852, 0.00017501413822174072, 0.00020685046911239624, 0.00023868680000305176, 0.0002705231308937073, 0.0003023594617843628, 0.0003341957926750183, 0.00036603212356567383, 0.00039786845445632935, 0.00042970478534698486, 0.0004615411162376404, 0.0004933774471282959, 0.0005252137780189514, 0.0005570501089096069, 0.0005888864398002625, 0.000620722770690918, 0.0006525591015815735, 0.000684395432472229, 0.0007162317633628845, 0.00074806809425354, 0.0007799044251441956, 0.0008117407560348511, 0.0008435770869255066, 0.0008754134178161621, 0.0009072497487068176, 0.0009390860795974731, 0.0009709224104881287, 0.0010027587413787842, 0.0010345950722694397, 0.0010664314031600952, 0.0010982677340507507, 0.0011301040649414062]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 12.0, 13.0, 7.0, 21.0, 38.0, 61.0, 113.0, 259.0, 637.0, 1681.0, 5895.0, 25898.0, 172151.0, 710633.0, 106804.0, 17611.0, 4286.0, 1466.0, 489.0, 202.0, 120.0, 57.0, 49.0, 20.0, 11.0, 5.0, 7.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884765625, -1.1434326171875, -1.098388671875, -1.0533447265625, -1.00830078125, -0.9632568359375, -0.918212890625, -0.8731689453125, -0.828125, -0.7830810546875, -0.738037109375, -0.6929931640625, -0.64794921875, -0.6029052734375, -0.557861328125, -0.5128173828125, -0.4677734375, -0.4227294921875, -0.377685546875, -0.3326416015625, -0.28759765625, -0.2425537109375, -0.197509765625, -0.1524658203125, -0.107421875, -0.0623779296875, -0.017333984375, 0.0277099609375, 0.07275390625, 0.1177978515625, 0.162841796875, 0.2078857421875, 0.2529296875, 0.2979736328125, 0.343017578125, 0.3880615234375, 0.43310546875, 0.4781494140625, 0.523193359375, 0.5682373046875, 0.61328125, 0.6583251953125, 0.703369140625, 0.7484130859375, 0.79345703125, 0.8385009765625, 0.883544921875, 0.9285888671875, 0.9736328125, 1.0186767578125, 1.063720703125, 1.1087646484375, 1.15380859375, 1.1988525390625, 1.243896484375, 1.2889404296875, 1.333984375, 1.3790283203125, 1.424072265625, 1.4691162109375, 1.51416015625, 1.5592041015625, 1.604248046875, 1.6492919921875, 1.6943359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 2.0, 6.0, 8.0, 10.0, 13.0, 18.0, 17.0, 24.0, 25.0, 31.0, 33.0, 38.0, 58.0, 56.0, 66.0, 67.0, 78.0, 58.0, 60.0, 52.0, 51.0, 41.0, 27.0, 34.0, 12.0, 17.0, 18.0, 15.0, 8.0, 5.0, 10.0, 12.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.931640625, -0.90252685546875, -0.8734130859375, -0.84429931640625, -0.815185546875, -0.78607177734375, -0.7569580078125, -0.72784423828125, -0.69873046875, -0.66961669921875, -0.6405029296875, -0.61138916015625, -0.582275390625, -0.55316162109375, -0.5240478515625, -0.49493408203125, -0.4658203125, -0.43670654296875, -0.4075927734375, -0.37847900390625, -0.349365234375, -0.32025146484375, -0.2911376953125, -0.26202392578125, -0.23291015625, -0.20379638671875, -0.1746826171875, -0.14556884765625, -0.116455078125, -0.08734130859375, -0.0582275390625, -0.02911376953125, 0.0, 0.02911376953125, 0.0582275390625, 0.08734130859375, 0.116455078125, 0.14556884765625, 0.1746826171875, 0.20379638671875, 0.23291015625, 0.26202392578125, 0.2911376953125, 0.32025146484375, 0.349365234375, 0.37847900390625, 0.4075927734375, 0.43670654296875, 0.4658203125, 0.49493408203125, 0.5240478515625, 0.55316162109375, 0.582275390625, 0.61138916015625, 0.6405029296875, 0.66961669921875, 0.69873046875, 0.72784423828125, 0.7569580078125, 0.78607177734375, 0.815185546875, 0.84429931640625, 0.8734130859375, 0.90252685546875, 0.931640625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 17.0, 16.0, 26.0, 43.0, 74.0, 97.0, 129.0, 197.0, 112.0, 97.0, 58.0, 37.0, 27.0, 15.0, 12.0, 5.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.30418586730957, -17.682147979736328, -17.06011199951172, -16.438074111938477, -15.816036224365234, -15.193998336791992, -14.571961402893066, -13.94992446899414, -13.327886581420898, -12.705848693847656, -12.08381175994873, -11.461774826049805, -10.839736938476562, -10.21769905090332, -9.595662117004395, -8.973625183105469, -8.351587295532227, -7.729549884796143, -7.107512474060059, -6.485475063323975, -5.863437652587891, -5.241400241851807, -4.619362831115723, -3.9973254203796387, -3.3752880096435547, -2.7532505989074707, -2.1312131881713867, -1.5091757774353027, -0.8871383666992188, -0.26510095596313477, 0.3569364547729492, 0.9789738655090332, 1.6010093688964844, 2.2230467796325684, 2.8450841903686523, 3.4671216011047363, 4.08915901184082, 4.711196422576904, 5.333233833312988, 5.955271244049072, 6.577308654785156, 7.19934606552124, 7.821383476257324, 8.44342041015625, 9.065458297729492, 9.687496185302734, 10.30953311920166, 10.931570053100586, 11.553607940673828, 12.17564582824707, 12.797682762145996, 13.419719696044922, 14.041757583618164, 14.663795471191406, 15.285832405090332, 15.907869338989258, 16.5299072265625, 17.151945114135742, 17.773983001708984, 18.396018981933594, 19.018056869506836, 19.640094757080078, 20.262130737304688, 20.88416862487793, 21.506206512451172]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 5.0, 8.0, 8.0, 10.0, 10.0, 21.0, 15.0, 25.0, 22.0, 29.0, 28.0, 37.0, 33.0, 40.0, 55.0, 79.0, 97.0, 81.0, 40.0, 42.0, 40.0, 30.0, 23.0, 38.0, 29.0, 25.0, 19.0, 18.0, 20.0, 14.0, 13.0, 9.0, 7.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.516998291015625, -17.951467514038086, -17.38593864440918, -16.82040786743164, -16.254878997802734, -15.689349174499512, -15.123819351196289, -14.55828857421875, -13.992759704589844, -13.427229881286621, -12.861700057983398, -12.296170234680176, -11.730640411376953, -11.16511058807373, -10.599580764770508, -10.034049987792969, -9.468520164489746, -8.902990341186523, -8.3374605178833, -7.771930694580078, -7.2064008712768555, -6.640871047973633, -6.075340747833252, -5.509810924530029, -4.944281101226807, -4.378751277923584, -3.8132214546203613, -3.2476913928985596, -2.682161569595337, -2.1166317462921143, -1.5511016845703125, -0.9855718612670898, -0.4200420379638672, 0.14548784494400024, 0.7110177278518677, 1.2765476703643799, 1.8420774936676025, 2.407607316970825, 2.973137378692627, 3.5386672019958496, 4.104197025299072, 4.669726848602295, 5.235256671905518, 5.800786972045898, 6.366316795349121, 6.931846618652344, 7.497376441955566, 8.062906265258789, 8.628436088562012, 9.193965911865234, 9.759495735168457, 10.32502555847168, 10.890555381774902, 11.456085205078125, 12.021615982055664, 12.58714485168457, 13.15267562866211, 13.718205451965332, 14.283735275268555, 14.849265098571777, 15.414794921875, 15.980324745178223, 16.545854568481445, 17.111385345458984, 17.67691421508789]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 4.0, 8.0, 15.0, 20.0, 36.0, 25.0, 51.0, 58.0, 79.0, 109.0, 158.0, 269.0, 363.0, 610.0, 1241.0, 2592.0, 5983.0, 16297.0, 59048.0, 281817.0, 1331996.0, 1869728.0, 490907.0, 93293.0, 24114.0, 8203.0, 3449.0, 1567.0, 832.0, 455.0, 289.0, 167.0, 143.0, 95.0, 60.0, 50.0, 30.0, 36.0, 12.0, 15.0, 13.0, 7.0, 7.0, 2.0, 4.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.2255859375, -1.1874847412109375, -1.149383544921875, -1.1112823486328125, -1.07318115234375, -1.0350799560546875, -0.996978759765625, -0.9588775634765625, -0.9207763671875, -0.8826751708984375, -0.844573974609375, -0.8064727783203125, -0.76837158203125, -0.7302703857421875, -0.692169189453125, -0.6540679931640625, -0.615966796875, -0.5778656005859375, -0.539764404296875, -0.5016632080078125, -0.46356201171875, -0.4254608154296875, -0.387359619140625, -0.3492584228515625, -0.3111572265625, -0.2730560302734375, -0.234954833984375, -0.1968536376953125, -0.15875244140625, -0.1206512451171875, -0.082550048828125, -0.0444488525390625, -0.00634765625, 0.0317535400390625, 0.069854736328125, 0.1079559326171875, 0.14605712890625, 0.1841583251953125, 0.222259521484375, 0.2603607177734375, 0.2984619140625, 0.3365631103515625, 0.374664306640625, 0.4127655029296875, 0.45086669921875, 0.4889678955078125, 0.527069091796875, 0.5651702880859375, 0.603271484375, 0.6413726806640625, 0.679473876953125, 0.7175750732421875, 0.75567626953125, 0.7937774658203125, 0.831878662109375, 0.8699798583984375, 0.9080810546875, 0.9461822509765625, 0.984283447265625, 1.0223846435546875, 1.06048583984375, 1.0985870361328125, 1.136688232421875, 1.1747894287109375, 1.212890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 6.0, 5.0, 9.0, 19.0, 16.0, 22.0, 29.0, 33.0, 37.0, 30.0, 41.0, 42.0, 46.0, 56.0, 48.0, 59.0, 56.0, 47.0, 54.0, 40.0, 39.0, 38.0, 33.0, 30.0, 31.0, 29.0, 21.0, 17.0, 16.0, 11.0, 10.0, 11.0, 3.0, 7.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.068084716796875, -1.03265380859375, -0.997222900390625, -0.9617919921875, -0.926361083984375, -0.89093017578125, -0.855499267578125, -0.820068359375, -0.784637451171875, -0.74920654296875, -0.713775634765625, -0.6783447265625, -0.642913818359375, -0.60748291015625, -0.572052001953125, -0.53662109375, -0.501190185546875, -0.46575927734375, -0.430328369140625, -0.3948974609375, -0.359466552734375, -0.32403564453125, -0.288604736328125, -0.253173828125, -0.217742919921875, -0.18231201171875, -0.146881103515625, -0.1114501953125, -0.076019287109375, -0.04058837890625, -0.005157470703125, 0.0302734375, 0.065704345703125, 0.10113525390625, 0.136566162109375, 0.1719970703125, 0.207427978515625, 0.24285888671875, 0.278289794921875, 0.313720703125, 0.349151611328125, 0.38458251953125, 0.420013427734375, 0.4554443359375, 0.490875244140625, 0.52630615234375, 0.561737060546875, 0.59716796875, 0.632598876953125, 0.66802978515625, 0.703460693359375, 0.7388916015625, 0.774322509765625, 0.80975341796875, 0.845184326171875, 0.880615234375, 0.916046142578125, 0.95147705078125, 0.986907958984375, 1.0223388671875, 1.057769775390625, 1.09320068359375, 1.128631591796875, 1.1640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 5.0, 6.0, 13.0, 20.0, 30.0, 38.0, 63.0, 98.0, 179.0, 365.0, 915.0, 2550.0, 11657.0, 127069.0, 3563651.0, 458596.0, 22868.0, 3929.0, 1195.0, 450.0, 244.0, 109.0, 76.0, 41.0, 34.0, 25.0, 11.0, 14.0, 6.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6328125, -3.521636962890625, -3.41046142578125, -3.299285888671875, -3.1881103515625, -3.076934814453125, -2.96575927734375, -2.854583740234375, -2.743408203125, -2.632232666015625, -2.52105712890625, -2.409881591796875, -2.2987060546875, -2.187530517578125, -2.07635498046875, -1.965179443359375, -1.85400390625, -1.742828369140625, -1.63165283203125, -1.520477294921875, -1.4093017578125, -1.298126220703125, -1.18695068359375, -1.075775146484375, -0.964599609375, -0.853424072265625, -0.74224853515625, -0.631072998046875, -0.5198974609375, -0.408721923828125, -0.29754638671875, -0.186370849609375, -0.0751953125, 0.035980224609375, 0.14715576171875, 0.258331298828125, 0.3695068359375, 0.480682373046875, 0.59185791015625, 0.703033447265625, 0.814208984375, 0.925384521484375, 1.03656005859375, 1.147735595703125, 1.2589111328125, 1.370086669921875, 1.48126220703125, 1.592437744140625, 1.70361328125, 1.814788818359375, 1.92596435546875, 2.037139892578125, 2.1483154296875, 2.259490966796875, 2.37066650390625, 2.481842041015625, 2.593017578125, 2.704193115234375, 2.81536865234375, 2.926544189453125, 3.0377197265625, 3.148895263671875, 3.26007080078125, 3.371246337890625, 3.482421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 7.0, 15.0, 16.0, 26.0, 38.0, 38.0, 38.0, 67.0, 99.0, 129.0, 208.0, 270.0, 448.0, 493.0, 593.0, 482.0, 367.0, 228.0, 149.0, 103.0, 76.0, 35.0, 38.0, 24.0, 15.0, 18.0, 13.0, 5.0, 4.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.041015625, -1.973297119140625, -1.90557861328125, -1.837860107421875, -1.7701416015625, -1.702423095703125, -1.63470458984375, -1.566986083984375, -1.499267578125, -1.431549072265625, -1.36383056640625, -1.296112060546875, -1.2283935546875, -1.160675048828125, -1.09295654296875, -1.025238037109375, -0.95751953125, -0.889801025390625, -0.82208251953125, -0.754364013671875, -0.6866455078125, -0.618927001953125, -0.55120849609375, -0.483489990234375, -0.415771484375, -0.348052978515625, -0.28033447265625, -0.212615966796875, -0.1448974609375, -0.077178955078125, -0.00946044921875, 0.058258056640625, 0.1259765625, 0.193695068359375, 0.26141357421875, 0.329132080078125, 0.3968505859375, 0.464569091796875, 0.53228759765625, 0.600006103515625, 0.667724609375, 0.735443115234375, 0.80316162109375, 0.870880126953125, 0.9385986328125, 1.006317138671875, 1.07403564453125, 1.141754150390625, 1.20947265625, 1.277191162109375, 1.34490966796875, 1.412628173828125, 1.4803466796875, 1.548065185546875, 1.61578369140625, 1.683502197265625, 1.751220703125, 1.818939208984375, 1.88665771484375, 1.954376220703125, 2.0220947265625, 2.089813232421875, 2.15753173828125, 2.225250244140625, 2.29296875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 12.0, 22.0, 32.0, 57.0, 87.0, 153.0, 145.0, 165.0, 118.0, 93.0, 42.0, 33.0, 19.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.616308212280273, -24.925312042236328, -24.234315872192383, -23.543319702148438, -22.852325439453125, -22.16132926940918, -21.470333099365234, -20.77933692932129, -20.088340759277344, -19.3973445892334, -18.706348419189453, -18.01535415649414, -17.324357986450195, -16.63336181640625, -15.942365646362305, -15.25136947631836, -14.560375213623047, -13.869379043579102, -13.178383827209473, -12.487387657165527, -11.796392440795898, -11.105396270751953, -10.414400100708008, -9.723403930664062, -9.032408714294434, -8.341412544250488, -7.650417327880859, -6.959421157836914, -6.268425464630127, -5.57742977142334, -4.8864336013793945, -4.195437908172607, -3.504444122314453, -2.813448429107666, -2.1224524974823, -1.4314565658569336, -0.7404608726501465, -0.049465179443359375, 0.6415309906005859, 1.332526683807373, 2.02352237701416, 2.7145180702209473, 3.4055140018463135, 4.09650993347168, 4.787505626678467, 5.478501319885254, 6.169497489929199, 6.860493183135986, 7.551488876342773, 8.242485046386719, 8.933480262756348, 9.624476432800293, 10.315471649169922, 11.006467819213867, 11.697463989257812, 12.388460159301758, 13.079455375671387, 13.770451545715332, 14.461446762084961, 15.152442932128906, 15.843439102172852, 16.534435272216797, 17.22542953491211, 17.916425704956055, 18.607421875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 11.0, 9.0, 17.0, 11.0, 16.0, 16.0, 22.0, 30.0, 28.0, 27.0, 43.0, 44.0, 48.0, 39.0, 59.0, 40.0, 51.0, 59.0, 38.0, 49.0, 40.0, 37.0, 44.0, 27.0, 30.0, 32.0, 22.0, 22.0, 14.0, 16.0, 11.0, 5.0, 8.0, 5.0, 3.0, 8.0, 1.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.094172477722168, -9.75648021697998, -9.418787956237793, -9.081095695495605, -8.743402481079102, -8.405710220336914, -8.068017959594727, -7.730325698852539, -7.392633438110352, -7.054941177368164, -6.717248916625977, -6.379556179046631, -6.041863918304443, -5.704171657562256, -5.36647891998291, -5.028786659240723, -4.691094398498535, -4.353402137756348, -4.01570987701416, -3.6780171394348145, -3.340324878692627, -3.0026326179504395, -2.664940118789673, -2.3272476196289062, -1.9895553588867188, -1.6518629789352417, -1.3141705989837646, -0.9764782190322876, -0.6387858390808105, -0.3010934591293335, 0.036598920822143555, 0.37429141998291016, 0.7119836807250977, 1.0496760606765747, 1.3873684406280518, 1.7250608205795288, 2.062753200531006, 2.4004454612731934, 2.73813796043396, 3.0758304595947266, 3.413522720336914, 3.7512149810791016, 4.088907241821289, 4.426599979400635, 4.764292240142822, 5.10198450088501, 5.4396772384643555, 5.777369499206543, 6.1150617599487305, 6.452754020690918, 6.7904462814331055, 7.128139019012451, 7.465831279754639, 7.803523540496826, 8.141216278076172, 8.47890853881836, 8.816600799560547, 9.154293060302734, 9.491985321044922, 9.82967758178711, 10.167369842529297, 10.5050630569458, 10.842755317687988, 11.180447578430176, 11.518139839172363]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 9.0, 16.0, 31.0, 34.0, 45.0, 63.0, 96.0, 148.0, 257.0, 421.0, 681.0, 1236.0, 2188.0, 3830.0, 7380.0, 14065.0, 26180.0, 50202.0, 94722.0, 169900.0, 238702.0, 195963.0, 113703.0, 60517.0, 31773.0, 16495.0, 8736.0, 4844.0, 2580.0, 1449.0, 876.0, 536.0, 305.0, 182.0, 107.0, 78.0, 58.0, 41.0, 28.0, 13.0, 14.0, 7.0, 5.0, 6.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1259765625, -1.0879974365234375, -1.050018310546875, -1.0120391845703125, -0.97406005859375, -0.9360809326171875, -0.898101806640625, -0.8601226806640625, -0.8221435546875, -0.7841644287109375, -0.746185302734375, -0.7082061767578125, -0.67022705078125, -0.6322479248046875, -0.594268798828125, -0.5562896728515625, -0.518310546875, -0.4803314208984375, -0.442352294921875, -0.4043731689453125, -0.36639404296875, -0.3284149169921875, -0.290435791015625, -0.2524566650390625, -0.2144775390625, -0.1764984130859375, -0.138519287109375, -0.1005401611328125, -0.06256103515625, -0.0245819091796875, 0.013397216796875, 0.0513763427734375, 0.08935546875, 0.1273345947265625, 0.165313720703125, 0.2032928466796875, 0.24127197265625, 0.2792510986328125, 0.317230224609375, 0.3552093505859375, 0.3931884765625, 0.4311676025390625, 0.469146728515625, 0.5071258544921875, 0.54510498046875, 0.5830841064453125, 0.621063232421875, 0.6590423583984375, 0.697021484375, 0.7350006103515625, 0.772979736328125, 0.8109588623046875, 0.84893798828125, 0.8869171142578125, 0.924896240234375, 0.9628753662109375, 1.0008544921875, 1.0388336181640625, 1.076812744140625, 1.1147918701171875, 1.15277099609375, 1.1907501220703125, 1.228729248046875, 1.2667083740234375, 1.3046875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 6.0, 10.0, 10.0, 8.0, 16.0, 22.0, 24.0, 24.0, 37.0, 32.0, 36.0, 39.0, 37.0, 54.0, 64.0, 43.0, 62.0, 46.0, 43.0, 56.0, 44.0, 49.0, 34.0, 28.0, 23.0, 36.0, 26.0, 25.0, 10.0, 12.0, 8.0, 7.0, 5.0, 11.0, 5.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1533203125, -1.1158905029296875, -1.078460693359375, -1.0410308837890625, -1.00360107421875, -0.9661712646484375, -0.928741455078125, -0.8913116455078125, -0.8538818359375, -0.8164520263671875, -0.779022216796875, -0.7415924072265625, -0.70416259765625, -0.6667327880859375, -0.629302978515625, -0.5918731689453125, -0.554443359375, -0.5170135498046875, -0.479583740234375, -0.4421539306640625, -0.40472412109375, -0.3672943115234375, -0.329864501953125, -0.2924346923828125, -0.2550048828125, -0.2175750732421875, -0.180145263671875, -0.1427154541015625, -0.10528564453125, -0.0678558349609375, -0.030426025390625, 0.0070037841796875, 0.04443359375, 0.0818634033203125, 0.119293212890625, 0.1567230224609375, 0.19415283203125, 0.2315826416015625, 0.269012451171875, 0.3064422607421875, 0.3438720703125, 0.3813018798828125, 0.418731689453125, 0.4561614990234375, 0.49359130859375, 0.5310211181640625, 0.568450927734375, 0.6058807373046875, 0.643310546875, 0.6807403564453125, 0.718170166015625, 0.7555999755859375, 0.79302978515625, 0.8304595947265625, 0.867889404296875, 0.9053192138671875, 0.9427490234375, 0.9801788330078125, 1.017608642578125, 1.0550384521484375, 1.09246826171875, 1.1298980712890625, 1.167327880859375, 1.2047576904296875, 1.2421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 8.0, 8.0, 12.0, 10.0, 14.0, 22.0, 31.0, 34.0, 71.0, 71.0, 119.0, 159.0, 218.0, 304.0, 489.0, 853.0, 1670.0, 3677.0, 9822.0, 30534.0, 112140.0, 565215.0, 232194.0, 60923.0, 17930.0, 6252.0, 2570.0, 1227.0, 657.0, 377.0, 268.0, 185.0, 124.0, 75.0, 71.0, 42.0, 39.0, 37.0, 21.0, 21.0, 9.0, 11.0, 9.0, 9.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0], "bins": [-2.60546875, -2.525970458984375, -2.44647216796875, -2.366973876953125, -2.2874755859375, -2.207977294921875, -2.12847900390625, -2.048980712890625, -1.969482421875, -1.889984130859375, -1.81048583984375, -1.730987548828125, -1.6514892578125, -1.571990966796875, -1.49249267578125, -1.412994384765625, -1.33349609375, -1.253997802734375, -1.17449951171875, -1.095001220703125, -1.0155029296875, -0.936004638671875, -0.85650634765625, -0.777008056640625, -0.697509765625, -0.618011474609375, -0.53851318359375, -0.459014892578125, -0.3795166015625, -0.300018310546875, -0.22052001953125, -0.141021728515625, -0.0615234375, 0.017974853515625, 0.09747314453125, 0.176971435546875, 0.2564697265625, 0.335968017578125, 0.41546630859375, 0.494964599609375, 0.574462890625, 0.653961181640625, 0.73345947265625, 0.812957763671875, 0.8924560546875, 0.971954345703125, 1.05145263671875, 1.130950927734375, 1.21044921875, 1.289947509765625, 1.36944580078125, 1.448944091796875, 1.5284423828125, 1.607940673828125, 1.68743896484375, 1.766937255859375, 1.846435546875, 1.925933837890625, 2.00543212890625, 2.084930419921875, 2.1644287109375, 2.243927001953125, 2.32342529296875, 2.402923583984375, 2.482421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 5.0, 7.0, 20.0, 12.0, 8.0, 18.0, 28.0, 27.0, 32.0, 32.0, 41.0, 55.0, 60.0, 59.0, 58.0, 54.0, 49.0, 57.0, 52.0, 44.0, 42.0, 39.0, 34.0, 28.0, 23.0, 31.0, 17.0, 12.0, 12.0, 11.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75390625, -4.60821533203125, -4.4625244140625, -4.31683349609375, -4.171142578125, -4.02545166015625, -3.8797607421875, -3.73406982421875, -3.58837890625, -3.44268798828125, -3.2969970703125, -3.15130615234375, -3.005615234375, -2.85992431640625, -2.7142333984375, -2.56854248046875, -2.4228515625, -2.27716064453125, -2.1314697265625, -1.98577880859375, -1.840087890625, -1.69439697265625, -1.5487060546875, -1.40301513671875, -1.25732421875, -1.11163330078125, -0.9659423828125, -0.82025146484375, -0.674560546875, -0.52886962890625, -0.3831787109375, -0.23748779296875, -0.091796875, 0.05389404296875, 0.1995849609375, 0.34527587890625, 0.490966796875, 0.63665771484375, 0.7823486328125, 0.92803955078125, 1.07373046875, 1.21942138671875, 1.3651123046875, 1.51080322265625, 1.656494140625, 1.80218505859375, 1.9478759765625, 2.09356689453125, 2.2392578125, 2.38494873046875, 2.5306396484375, 2.67633056640625, 2.822021484375, 2.96771240234375, 3.1134033203125, 3.25909423828125, 3.40478515625, 3.55047607421875, 3.6961669921875, 3.84185791015625, 3.987548828125, 4.13323974609375, 4.2789306640625, 4.42462158203125, 4.5703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 6.0, 1.0, 2.0, 6.0, 3.0, 10.0, 6.0, 16.0, 20.0, 17.0, 21.0, 49.0, 44.0, 70.0, 76.0, 132.0, 175.0, 310.0, 518.0, 996.0, 1900.0, 4213.0, 10508.0, 29379.0, 97141.0, 577568.0, 231069.0, 60680.0, 19753.0, 7206.0, 3063.0, 1476.0, 787.0, 439.0, 286.0, 177.0, 116.0, 91.0, 63.0, 40.0, 28.0, 22.0, 22.0, 5.0, 9.0, 10.0, 12.0, 4.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.765625, -0.74298095703125, -0.7203369140625, -0.69769287109375, -0.675048828125, -0.65240478515625, -0.6297607421875, -0.60711669921875, -0.58447265625, -0.56182861328125, -0.5391845703125, -0.51654052734375, -0.493896484375, -0.47125244140625, -0.4486083984375, -0.42596435546875, -0.4033203125, -0.38067626953125, -0.3580322265625, -0.33538818359375, -0.312744140625, -0.29010009765625, -0.2674560546875, -0.24481201171875, -0.22216796875, -0.19952392578125, -0.1768798828125, -0.15423583984375, -0.131591796875, -0.10894775390625, -0.0863037109375, -0.06365966796875, -0.041015625, -0.01837158203125, 0.0042724609375, 0.02691650390625, 0.049560546875, 0.07220458984375, 0.0948486328125, 0.11749267578125, 0.14013671875, 0.16278076171875, 0.1854248046875, 0.20806884765625, 0.230712890625, 0.25335693359375, 0.2760009765625, 0.29864501953125, 0.3212890625, 0.34393310546875, 0.3665771484375, 0.38922119140625, 0.411865234375, 0.43450927734375, 0.4571533203125, 0.47979736328125, 0.50244140625, 0.52508544921875, 0.5477294921875, 0.57037353515625, 0.593017578125, 0.61566162109375, 0.6383056640625, 0.66094970703125, 0.68359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 10.0, 7.0, 18.0, 24.0, 27.0, 28.0, 40.0, 64.0, 87.0, 124.0, 147.0, 103.0, 75.0, 63.0, 34.0, 30.0, 25.0, 23.0, 12.0, 12.0, 9.0, 8.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003604888916015625, -0.0003499835729598999, -0.0003394782543182373, -0.0003289729356765747, -0.0003184676170349121, -0.0003079622983932495, -0.0002974569797515869, -0.0002869516611099243, -0.0002764463424682617, -0.0002659410238265991, -0.0002554357051849365, -0.0002449303865432739, -0.00023442506790161133, -0.00022391974925994873, -0.00021341443061828613, -0.00020290911197662354, -0.00019240379333496094, -0.00018189847469329834, -0.00017139315605163574, -0.00016088783740997314, -0.00015038251876831055, -0.00013987720012664795, -0.00012937188148498535, -0.00011886656284332275, -0.00010836124420166016, -9.785592555999756e-05, -8.735060691833496e-05, -7.684528827667236e-05, -6.633996963500977e-05, -5.583465099334717e-05, -4.532933235168457e-05, -3.482401371002197e-05, -2.4318695068359375e-05, -1.3813376426696777e-05, -3.3080577850341797e-06, 7.197260856628418e-06, 1.7702579498291016e-05, 2.8207898139953613e-05, 3.871321678161621e-05, 4.921853542327881e-05, 5.9723854064941406e-05, 7.0229172706604e-05, 8.07344913482666e-05, 9.12398099899292e-05, 0.0001017451286315918, 0.0001122504472732544, 0.000122755765914917, 0.0001332610845565796, 0.0001437664031982422, 0.00015427172183990479, 0.00016477704048156738, 0.00017528235912322998, 0.00018578767776489258, 0.00019629299640655518, 0.00020679831504821777, 0.00021730363368988037, 0.00022780895233154297, 0.00023831427097320557, 0.00024881958961486816, 0.00025932490825653076, 0.00026983022689819336, 0.00028033554553985596, 0.00029084086418151855, 0.00030134618282318115, 0.00031185150146484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 2.0, 5.0, 6.0, 3.0, 6.0, 6.0, 6.0, 15.0, 13.0, 25.0, 34.0, 33.0, 74.0, 114.0, 156.0, 284.0, 445.0, 840.0, 1709.0, 3946.0, 10930.0, 35420.0, 148503.0, 652036.0, 141977.0, 34022.0, 10460.0, 3890.0, 1666.0, 766.0, 435.0, 217.0, 149.0, 114.0, 75.0, 58.0, 35.0, 15.0, 17.0, 16.0, 11.0, 4.0, 4.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.7783203125, -0.751922607421875, -0.72552490234375, -0.699127197265625, -0.6727294921875, -0.646331787109375, -0.61993408203125, -0.593536376953125, -0.567138671875, -0.540740966796875, -0.51434326171875, -0.487945556640625, -0.4615478515625, -0.435150146484375, -0.40875244140625, -0.382354736328125, -0.35595703125, -0.329559326171875, -0.30316162109375, -0.276763916015625, -0.2503662109375, -0.223968505859375, -0.19757080078125, -0.171173095703125, -0.144775390625, -0.118377685546875, -0.09197998046875, -0.065582275390625, -0.0391845703125, -0.012786865234375, 0.01361083984375, 0.040008544921875, 0.06640625, 0.092803955078125, 0.11920166015625, 0.145599365234375, 0.1719970703125, 0.198394775390625, 0.22479248046875, 0.251190185546875, 0.277587890625, 0.303985595703125, 0.33038330078125, 0.356781005859375, 0.3831787109375, 0.409576416015625, 0.43597412109375, 0.462371826171875, 0.48876953125, 0.515167236328125, 0.54156494140625, 0.567962646484375, 0.5943603515625, 0.620758056640625, 0.64715576171875, 0.673553466796875, 0.699951171875, 0.726348876953125, 0.75274658203125, 0.779144287109375, 0.8055419921875, 0.831939697265625, 0.85833740234375, 0.884735107421875, 0.9111328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 12.0, 13.0, 11.0, 15.0, 20.0, 25.0, 35.0, 46.0, 49.0, 64.0, 74.0, 85.0, 80.0, 83.0, 75.0, 57.0, 49.0, 39.0, 28.0, 25.0, 18.0, 15.0, 10.0, 19.0, 12.0, 3.0, 3.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1015625, -1.070709228515625, -1.03985595703125, -1.009002685546875, -0.9781494140625, -0.947296142578125, -0.91644287109375, -0.885589599609375, -0.854736328125, -0.823883056640625, -0.79302978515625, -0.762176513671875, -0.7313232421875, -0.700469970703125, -0.66961669921875, -0.638763427734375, -0.60791015625, -0.577056884765625, -0.54620361328125, -0.515350341796875, -0.4844970703125, -0.453643798828125, -0.42279052734375, -0.391937255859375, -0.361083984375, -0.330230712890625, -0.29937744140625, -0.268524169921875, -0.2376708984375, -0.206817626953125, -0.17596435546875, -0.145111083984375, -0.1142578125, -0.083404541015625, -0.05255126953125, -0.021697998046875, 0.0091552734375, 0.040008544921875, 0.07086181640625, 0.101715087890625, 0.132568359375, 0.163421630859375, 0.19427490234375, 0.225128173828125, 0.2559814453125, 0.286834716796875, 0.31768798828125, 0.348541259765625, 0.37939453125, 0.410247802734375, 0.44110107421875, 0.471954345703125, 0.5028076171875, 0.533660888671875, 0.56451416015625, 0.595367431640625, 0.626220703125, 0.657073974609375, 0.68792724609375, 0.718780517578125, 0.7496337890625, 0.780487060546875, 0.81134033203125, 0.842193603515625, 0.873046875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 13.0, 9.0, 12.0, 33.0, 24.0, 61.0, 96.0, 227.0, 209.0, 107.0, 80.0, 53.0, 23.0, 22.0, 10.0, 8.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.340713500976562, -19.66080093383789, -18.98088836669922, -18.300975799560547, -17.621063232421875, -16.941152572631836, -16.261240005493164, -15.581327438354492, -14.90141487121582, -14.221502304077148, -13.541589736938477, -12.861678123474121, -12.18176555633545, -11.501852989196777, -10.821941375732422, -10.14202880859375, -9.462116241455078, -8.782203674316406, -8.102291107177734, -7.422379493713379, -6.742466926574707, -6.062554359436035, -5.3826422691345215, -4.702730178833008, -4.022817611694336, -3.342905282974243, -2.6629929542541504, -1.9830806255340576, -1.3031682968139648, -0.6232559680938721, 0.0566563606262207, 0.7365684509277344, 1.4164810180664062, 2.096393346786499, 2.776305675506592, 3.4562180042266846, 4.136130332946777, 4.816042900085449, 5.495954990386963, 6.175867080688477, 6.855779647827148, 7.53569221496582, 8.215604782104492, 8.895516395568848, 9.57542896270752, 10.255341529846191, 10.935253143310547, 11.615165710449219, 12.29507827758789, 12.974990844726562, 13.654903411865234, 14.33481502532959, 15.014727592468262, 15.694640159606934, 16.37455177307129, 17.05446434020996, 17.734376907348633, 18.414289474487305, 19.094202041625977, 19.77411460876465, 20.454025268554688, 21.13393783569336, 21.81385040283203, 22.493762969970703, 23.173675537109375]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 7.0, 13.0, 13.0, 21.0, 16.0, 27.0, 21.0, 27.0, 31.0, 24.0, 32.0, 48.0, 62.0, 97.0, 138.0, 68.0, 46.0, 43.0, 33.0, 27.0, 36.0, 33.0, 28.0, 14.0, 12.0, 10.0, 12.0, 10.0, 11.0, 6.0, 3.0, 1.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.02457046508789, -19.438522338867188, -18.852474212646484, -18.26642417907715, -17.680376052856445, -17.094327926635742, -16.508277893066406, -15.922229766845703, -15.336181640625, -14.750133514404297, -14.164084434509277, -13.578035354614258, -12.991987228393555, -12.405939102172852, -11.819890022277832, -11.233840942382812, -10.64779281616211, -10.061744689941406, -9.475695610046387, -8.889646530151367, -8.303598403930664, -7.717549800872803, -7.131501197814941, -6.54545259475708, -5.959403991699219, -5.373355388641357, -4.787306785583496, -4.201258182525635, -3.6152095794677734, -3.029160976409912, -2.443112373352051, -1.8570637702941895, -1.2710151672363281, -0.6849665641784668, -0.09891796112060547, 0.48713064193725586, 1.0731792449951172, 1.6592278480529785, 2.24527645111084, 2.831325054168701, 3.4173736572265625, 4.003422260284424, 4.589470863342285, 5.1755194664001465, 5.761568069458008, 6.347616672515869, 6.9336652755737305, 7.519713878631592, 8.105762481689453, 8.691810607910156, 9.277859687805176, 9.863908767700195, 10.449956893920898, 11.036005020141602, 11.622054100036621, 12.20810317993164, 12.794151306152344, 13.380199432373047, 13.966248512268066, 14.552297592163086, 15.138345718383789, 15.724393844604492, 16.310443878173828, 16.89649200439453, 17.482540130615234]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 8.0, 14.0, 29.0, 41.0, 72.0, 111.0, 177.0, 295.0, 506.0, 936.0, 1792.0, 3727.0, 8277.0, 20201.0, 56956.0, 177781.0, 589893.0, 1491019.0, 1224795.0, 424058.0, 125614.0, 40095.0, 14944.0, 6407.0, 3021.0, 1540.0, 771.0, 464.0, 284.0, 177.0, 123.0, 53.0, 35.0, 26.0, 16.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0537109375, -1.024322509765625, -0.99493408203125, -0.965545654296875, -0.9361572265625, -0.906768798828125, -0.87738037109375, -0.847991943359375, -0.818603515625, -0.789215087890625, -0.75982666015625, -0.730438232421875, -0.7010498046875, -0.671661376953125, -0.64227294921875, -0.612884521484375, -0.58349609375, -0.554107666015625, -0.52471923828125, -0.495330810546875, -0.4659423828125, -0.436553955078125, -0.40716552734375, -0.377777099609375, -0.348388671875, -0.319000244140625, -0.28961181640625, -0.260223388671875, -0.2308349609375, -0.201446533203125, -0.17205810546875, -0.142669677734375, -0.11328125, -0.083892822265625, -0.05450439453125, -0.025115966796875, 0.0042724609375, 0.033660888671875, 0.06304931640625, 0.092437744140625, 0.121826171875, 0.151214599609375, 0.18060302734375, 0.209991455078125, 0.2393798828125, 0.268768310546875, 0.29815673828125, 0.327545166015625, 0.35693359375, 0.386322021484375, 0.41571044921875, 0.445098876953125, 0.4744873046875, 0.503875732421875, 0.53326416015625, 0.562652587890625, 0.592041015625, 0.621429443359375, 0.65081787109375, 0.680206298828125, 0.7095947265625, 0.738983154296875, 0.76837158203125, 0.797760009765625, 0.8271484375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 7.0, 0.0, 6.0, 8.0, 9.0, 7.0, 12.0, 17.0, 20.0, 16.0, 22.0, 32.0, 39.0, 34.0, 36.0, 45.0, 48.0, 48.0, 46.0, 53.0, 45.0, 52.0, 51.0, 46.0, 44.0, 46.0, 41.0, 30.0, 20.0, 17.0, 23.0, 14.0, 14.0, 10.0, 9.0, 9.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.015625, -0.9805145263671875, -0.945404052734375, -0.9102935791015625, -0.87518310546875, -0.8400726318359375, -0.804962158203125, -0.7698516845703125, -0.7347412109375, -0.6996307373046875, -0.664520263671875, -0.6294097900390625, -0.59429931640625, -0.5591888427734375, -0.524078369140625, -0.4889678955078125, -0.453857421875, -0.4187469482421875, -0.383636474609375, -0.3485260009765625, -0.31341552734375, -0.2783050537109375, -0.243194580078125, -0.2080841064453125, -0.1729736328125, -0.1378631591796875, -0.102752685546875, -0.0676422119140625, -0.03253173828125, 0.0025787353515625, 0.037689208984375, 0.0727996826171875, 0.10791015625, 0.1430206298828125, 0.178131103515625, 0.2132415771484375, 0.24835205078125, 0.2834625244140625, 0.318572998046875, 0.3536834716796875, 0.3887939453125, 0.4239044189453125, 0.459014892578125, 0.4941253662109375, 0.52923583984375, 0.5643463134765625, 0.599456787109375, 0.6345672607421875, 0.669677734375, 0.7047882080078125, 0.739898681640625, 0.7750091552734375, 0.81011962890625, 0.8452301025390625, 0.880340576171875, 0.9154510498046875, 0.9505615234375, 0.9856719970703125, 1.020782470703125, 1.0558929443359375, 1.09100341796875, 1.1261138916015625, 1.161224365234375, 1.1963348388671875, 1.2314453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 11.0, 13.0, 17.0, 31.0, 47.0, 68.0, 138.0, 272.0, 641.0, 2427.0, 16022.0, 292653.0, 3720221.0, 148473.0, 10315.0, 1837.0, 548.0, 233.0, 110.0, 70.0, 42.0, 27.0, 21.0, 14.0, 9.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.55078125, -3.4300537109375, -3.309326171875, -3.1885986328125, -3.06787109375, -2.9471435546875, -2.826416015625, -2.7056884765625, -2.5849609375, -2.4642333984375, -2.343505859375, -2.2227783203125, -2.10205078125, -1.9813232421875, -1.860595703125, -1.7398681640625, -1.619140625, -1.4984130859375, -1.377685546875, -1.2569580078125, -1.13623046875, -1.0155029296875, -0.894775390625, -0.7740478515625, -0.6533203125, -0.5325927734375, -0.411865234375, -0.2911376953125, -0.17041015625, -0.0496826171875, 0.071044921875, 0.1917724609375, 0.3125, 0.4332275390625, 0.553955078125, 0.6746826171875, 0.79541015625, 0.9161376953125, 1.036865234375, 1.1575927734375, 1.2783203125, 1.3990478515625, 1.519775390625, 1.6405029296875, 1.76123046875, 1.8819580078125, 2.002685546875, 2.1234130859375, 2.244140625, 2.3648681640625, 2.485595703125, 2.6063232421875, 2.72705078125, 2.8477783203125, 2.968505859375, 3.0892333984375, 3.2099609375, 3.3306884765625, 3.451416015625, 3.5721435546875, 3.69287109375, 3.8135986328125, 3.934326171875, 4.0550537109375, 4.17578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 8.0, 16.0, 17.0, 27.0, 24.0, 44.0, 43.0, 71.0, 95.0, 155.0, 229.0, 326.0, 483.0, 537.0, 574.0, 442.0, 309.0, 211.0, 131.0, 95.0, 57.0, 43.0, 30.0, 24.0, 16.0, 17.0, 8.0, 10.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.26171875, -2.188629150390625, -2.11553955078125, -2.042449951171875, -1.9693603515625, -1.896270751953125, -1.82318115234375, -1.750091552734375, -1.677001953125, -1.603912353515625, -1.53082275390625, -1.457733154296875, -1.3846435546875, -1.311553955078125, -1.23846435546875, -1.165374755859375, -1.09228515625, -1.019195556640625, -0.94610595703125, -0.873016357421875, -0.7999267578125, -0.726837158203125, -0.65374755859375, -0.580657958984375, -0.507568359375, -0.434478759765625, -0.36138916015625, -0.288299560546875, -0.2152099609375, -0.142120361328125, -0.06903076171875, 0.004058837890625, 0.0771484375, 0.150238037109375, 0.22332763671875, 0.296417236328125, 0.3695068359375, 0.442596435546875, 0.51568603515625, 0.588775634765625, 0.661865234375, 0.734954833984375, 0.80804443359375, 0.881134033203125, 0.9542236328125, 1.027313232421875, 1.10040283203125, 1.173492431640625, 1.24658203125, 1.319671630859375, 1.39276123046875, 1.465850830078125, 1.5389404296875, 1.612030029296875, 1.68511962890625, 1.758209228515625, 1.831298828125, 1.904388427734375, 1.97747802734375, 2.050567626953125, 2.1236572265625, 2.196746826171875, 2.26983642578125, 2.342926025390625, 2.416015625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 1.0, 5.0, 6.0, 27.0, 58.0, 109.0, 195.0, 238.0, 182.0, 110.0, 37.0, 11.0, 11.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.34957504272461, -17.300260543823242, -16.250946044921875, -15.20163345336914, -14.152318954467773, -13.103004455566406, -12.053690910339355, -11.004377365112305, -9.955062866210938, -8.90574836730957, -7.8564348220825195, -6.8071208000183105, -5.757806777954102, -4.708492755889893, -3.6591787338256836, -2.6098647117614746, -1.5605506896972656, -0.5112366676330566, 0.5380773544311523, 1.5873913764953613, 2.6367053985595703, 3.6860194206237793, 4.735333442687988, 5.784647464752197, 6.833961486816406, 7.883275508880615, 8.932589530944824, 9.981903076171875, 11.031217575073242, 12.08053207397461, 13.12984561920166, 14.179159164428711, 15.228477478027344, 16.27779197692871, 17.327106475830078, 18.376419067382812, 19.42573356628418, 20.475048065185547, 21.52436065673828, 22.57367515563965, 23.622989654541016, 24.672304153442383, 25.72161865234375, 26.770931243896484, 27.82024574279785, 28.86956024169922, 29.918872833251953, 30.96818733215332, 32.01750183105469, 33.06681442260742, 34.11613082885742, 35.165443420410156, 36.214759826660156, 37.26407241821289, 38.313385009765625, 39.362701416015625, 40.41201400756836, 41.461326599121094, 42.510643005371094, 43.55995559692383, 44.60926818847656, 45.65858459472656, 46.7078971862793, 47.7572135925293, 48.80652618408203]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 11.0, 5.0, 11.0, 12.0, 17.0, 20.0, 28.0, 24.0, 29.0, 25.0, 30.0, 16.0, 39.0, 41.0, 48.0, 46.0, 35.0, 27.0, 53.0, 37.0, 34.0, 37.0, 49.0, 47.0, 37.0, 25.0, 42.0, 20.0, 34.0, 14.0, 20.0, 17.0, 20.0, 17.0, 11.0, 4.0, 8.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.1329345703125, -11.789010047912598, -11.445085525512695, -11.101161003112793, -10.75723648071289, -10.413312911987305, -10.069388389587402, -9.7254638671875, -9.381539344787598, -9.037614822387695, -8.693690299987793, -8.34976577758789, -8.005842208862305, -7.661917209625244, -7.3179931640625, -6.974068641662598, -6.630144119262695, -6.286219596862793, -5.942295074462891, -5.5983710289001465, -5.254446506500244, -4.910521984100342, -4.566597938537598, -4.222673416137695, -3.878748893737793, -3.5348243713378906, -3.1909000873565674, -2.846975803375244, -2.503051280975342, -2.1591267585754395, -1.8152024745941162, -1.471278190612793, -1.1273527145385742, -0.7834283113479614, -0.43950390815734863, -0.09557950496673584, 0.24834489822387695, 0.5922693014144897, 0.9361937046051025, 1.2801179885864258, 1.6240425109863281, 1.967966914176941, 2.3118913173675537, 2.655815601348877, 2.9997401237487793, 3.3436646461486816, 3.687588930130005, 4.031513214111328, 4.3754377365112305, 4.719362258911133, 5.063286781311035, 5.407210826873779, 5.751135349273682, 6.095059871673584, 6.438983917236328, 6.7829084396362305, 7.126832962036133, 7.470757484436035, 7.8146820068359375, 8.15860652923584, 8.502531051635742, 8.846454620361328, 9.19037914276123, 9.534303665161133, 9.878228187561035]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 11.0, 7.0, 12.0, 15.0, 13.0, 27.0, 50.0, 84.0, 135.0, 159.0, 288.0, 422.0, 610.0, 1056.0, 1584.0, 2684.0, 4443.0, 7769.0, 14268.0, 26968.0, 52934.0, 110498.0, 225874.0, 280177.0, 160509.0, 75955.0, 37132.0, 19454.0, 10408.0, 5796.0, 3587.0, 2031.0, 1258.0, 820.0, 517.0, 336.0, 204.0, 147.0, 104.0, 73.0, 57.0, 30.0, 20.0, 5.0, 5.0, 3.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0], "bins": [-1.8017578125, -1.750640869140625, -1.69952392578125, -1.648406982421875, -1.5972900390625, -1.546173095703125, -1.49505615234375, -1.443939208984375, -1.392822265625, -1.341705322265625, -1.29058837890625, -1.239471435546875, -1.1883544921875, -1.137237548828125, -1.08612060546875, -1.035003662109375, -0.98388671875, -0.932769775390625, -0.88165283203125, -0.830535888671875, -0.7794189453125, -0.728302001953125, -0.67718505859375, -0.626068115234375, -0.574951171875, -0.523834228515625, -0.47271728515625, -0.421600341796875, -0.3704833984375, -0.319366455078125, -0.26824951171875, -0.217132568359375, -0.166015625, -0.114898681640625, -0.06378173828125, -0.012664794921875, 0.0384521484375, 0.089569091796875, 0.14068603515625, 0.191802978515625, 0.242919921875, 0.294036865234375, 0.34515380859375, 0.396270751953125, 0.4473876953125, 0.498504638671875, 0.54962158203125, 0.600738525390625, 0.65185546875, 0.702972412109375, 0.75408935546875, 0.805206298828125, 0.8563232421875, 0.907440185546875, 0.95855712890625, 1.009674072265625, 1.060791015625, 1.111907958984375, 1.16302490234375, 1.214141845703125, 1.2652587890625, 1.316375732421875, 1.36749267578125, 1.418609619140625, 1.4697265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 4.0, 10.0, 3.0, 6.0, 7.0, 8.0, 8.0, 11.0, 21.0, 13.0, 30.0, 22.0, 26.0, 23.0, 33.0, 38.0, 22.0, 23.0, 42.0, 38.0, 46.0, 52.0, 50.0, 47.0, 36.0, 38.0, 27.0, 44.0, 30.0, 27.0, 22.0, 32.0, 20.0, 20.0, 19.0, 12.0, 12.0, 13.0, 10.0, 7.0, 9.0, 6.0, 4.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.93603515625, -0.9051132202148438, -0.8741912841796875, -0.8432693481445312, -0.812347412109375, -0.7814254760742188, -0.7505035400390625, -0.7195816040039062, -0.68865966796875, -0.6577377319335938, -0.6268157958984375, -0.5958938598632812, -0.564971923828125, -0.5340499877929688, -0.5031280517578125, -0.47220611572265625, -0.4412841796875, -0.41036224365234375, -0.3794403076171875, -0.34851837158203125, -0.317596435546875, -0.28667449951171875, -0.2557525634765625, -0.22483062744140625, -0.19390869140625, -0.16298675537109375, -0.1320648193359375, -0.10114288330078125, -0.070220947265625, -0.03929901123046875, -0.0083770751953125, 0.02254486083984375, 0.053466796875, 0.08438873291015625, 0.1153106689453125, 0.14623260498046875, 0.177154541015625, 0.20807647705078125, 0.2389984130859375, 0.26992034912109375, 0.30084228515625, 0.33176422119140625, 0.3626861572265625, 0.39360809326171875, 0.424530029296875, 0.45545196533203125, 0.4863739013671875, 0.5172958374023438, 0.5482177734375, 0.5791397094726562, 0.6100616455078125, 0.6409835815429688, 0.671905517578125, 0.7028274536132812, 0.7337493896484375, 0.7646713256835938, 0.79559326171875, 0.8265151977539062, 0.8574371337890625, 0.8883590698242188, 0.919281005859375, 0.9502029418945312, 0.9811248779296875, 1.0120468139648438, 1.04296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 4.0, 11.0, 12.0, 11.0, 13.0, 31.0, 33.0, 34.0, 63.0, 61.0, 108.0, 156.0, 212.0, 316.0, 490.0, 857.0, 1684.0, 4142.0, 13515.0, 68983.0, 684425.0, 224801.0, 34384.0, 8044.0, 2886.0, 1265.0, 688.0, 404.0, 271.0, 176.0, 119.0, 101.0, 66.0, 36.0, 46.0, 30.0, 15.0, 21.0, 4.0, 10.0, 6.0, 5.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0], "bins": [-4.1484375, -4.03570556640625, -3.9229736328125, -3.81024169921875, -3.697509765625, -3.58477783203125, -3.4720458984375, -3.35931396484375, -3.24658203125, -3.13385009765625, -3.0211181640625, -2.90838623046875, -2.795654296875, -2.68292236328125, -2.5701904296875, -2.45745849609375, -2.3447265625, -2.23199462890625, -2.1192626953125, -2.00653076171875, -1.893798828125, -1.78106689453125, -1.6683349609375, -1.55560302734375, -1.44287109375, -1.33013916015625, -1.2174072265625, -1.10467529296875, -0.991943359375, -0.87921142578125, -0.7664794921875, -0.65374755859375, -0.541015625, -0.42828369140625, -0.3155517578125, -0.20281982421875, -0.090087890625, 0.02264404296875, 0.1353759765625, 0.24810791015625, 0.36083984375, 0.47357177734375, 0.5863037109375, 0.69903564453125, 0.811767578125, 0.92449951171875, 1.0372314453125, 1.14996337890625, 1.2626953125, 1.37542724609375, 1.4881591796875, 1.60089111328125, 1.713623046875, 1.82635498046875, 1.9390869140625, 2.05181884765625, 2.16455078125, 2.27728271484375, 2.3900146484375, 2.50274658203125, 2.615478515625, 2.72821044921875, 2.8409423828125, 2.95367431640625, 3.06640625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 9.0, 13.0, 11.0, 13.0, 14.0, 23.0, 19.0, 36.0, 36.0, 38.0, 52.0, 60.0, 73.0, 77.0, 73.0, 61.0, 64.0, 66.0, 52.0, 36.0, 39.0, 32.0, 23.0, 21.0, 11.0, 15.0, 8.0, 7.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.95703125, -5.783447265625, -5.60986328125, -5.436279296875, -5.2626953125, -5.089111328125, -4.91552734375, -4.741943359375, -4.568359375, -4.394775390625, -4.22119140625, -4.047607421875, -3.8740234375, -3.700439453125, -3.52685546875, -3.353271484375, -3.1796875, -3.006103515625, -2.83251953125, -2.658935546875, -2.4853515625, -2.311767578125, -2.13818359375, -1.964599609375, -1.791015625, -1.617431640625, -1.44384765625, -1.270263671875, -1.0966796875, -0.923095703125, -0.74951171875, -0.575927734375, -0.40234375, -0.228759765625, -0.05517578125, 0.118408203125, 0.2919921875, 0.465576171875, 0.63916015625, 0.812744140625, 0.986328125, 1.159912109375, 1.33349609375, 1.507080078125, 1.6806640625, 1.854248046875, 2.02783203125, 2.201416015625, 2.375, 2.548583984375, 2.72216796875, 2.895751953125, 3.0693359375, 3.242919921875, 3.41650390625, 3.590087890625, 3.763671875, 3.937255859375, 4.11083984375, 4.284423828125, 4.4580078125, 4.631591796875, 4.80517578125, 4.978759765625, 5.15234375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 14.0, 21.0, 32.0, 40.0, 43.0, 77.0, 114.0, 209.0, 293.0, 616.0, 1152.0, 2633.0, 7276.0, 24870.0, 100615.0, 666028.0, 183734.0, 42228.0, 11495.0, 3657.0, 1557.0, 752.0, 418.0, 222.0, 130.0, 109.0, 51.0, 44.0, 22.0, 19.0, 13.0, 12.0, 10.0, 7.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6064453125, -0.5845489501953125, -0.562652587890625, -0.5407562255859375, -0.51885986328125, -0.4969635009765625, -0.475067138671875, -0.4531707763671875, -0.4312744140625, -0.4093780517578125, -0.387481689453125, -0.3655853271484375, -0.34368896484375, -0.3217926025390625, -0.299896240234375, -0.2779998779296875, -0.256103515625, -0.2342071533203125, -0.212310791015625, -0.1904144287109375, -0.16851806640625, -0.1466217041015625, -0.124725341796875, -0.1028289794921875, -0.0809326171875, -0.0590362548828125, -0.037139892578125, -0.0152435302734375, 0.00665283203125, 0.0285491943359375, 0.050445556640625, 0.0723419189453125, 0.09423828125, 0.1161346435546875, 0.138031005859375, 0.1599273681640625, 0.18182373046875, 0.2037200927734375, 0.225616455078125, 0.2475128173828125, 0.2694091796875, 0.2913055419921875, 0.313201904296875, 0.3350982666015625, 0.35699462890625, 0.3788909912109375, 0.400787353515625, 0.4226837158203125, 0.444580078125, 0.4664764404296875, 0.488372802734375, 0.5102691650390625, 0.53216552734375, 0.5540618896484375, 0.575958251953125, 0.5978546142578125, 0.6197509765625, 0.6416473388671875, 0.663543701171875, 0.6854400634765625, 0.70733642578125, 0.7292327880859375, 0.751129150390625, 0.7730255126953125, 0.794921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 8.0, 13.0, 19.0, 28.0, 35.0, 39.0, 59.0, 72.0, 100.0, 129.0, 117.0, 108.0, 75.0, 50.0, 37.0, 33.0, 23.0, 15.0, 7.0, 6.0, 6.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027680397033691406, -0.0002661310136318207, -0.0002554580569267273, -0.0002447851002216339, -0.00023411214351654053, -0.00022343918681144714, -0.00021276623010635376, -0.00020209327340126038, -0.000191420316696167, -0.0001807473599910736, -0.00017007440328598022, -0.00015940144658088684, -0.00014872848987579346, -0.00013805553317070007, -0.0001273825764656067, -0.0001167096197605133, -0.00010603666305541992, -9.536370635032654e-05, -8.469074964523315e-05, -7.401779294013977e-05, -6.334483623504639e-05, -5.2671879529953e-05, -4.199892282485962e-05, -3.1325966119766235e-05, -2.065300941467285e-05, -9.980052709579468e-06, 6.92903995513916e-07, 1.13658607006073e-05, 2.2038817405700684e-05, 3.271177411079407e-05, 4.338473081588745e-05, 5.4057687520980835e-05, 6.473064422607422e-05, 7.54036009311676e-05, 8.607655763626099e-05, 9.674951434135437e-05, 0.00010742247104644775, 0.00011809542775154114, 0.00012876838445663452, 0.0001394413411617279, 0.0001501142978668213, 0.00016078725457191467, 0.00017146021127700806, 0.00018213316798210144, 0.00019280612468719482, 0.0002034790813922882, 0.0002141520380973816, 0.00022482499480247498, 0.00023549795150756836, 0.00024617090821266174, 0.0002568438649177551, 0.0002675168216228485, 0.0002781897783279419, 0.0002888627350330353, 0.00029953569173812866, 0.00031020864844322205, 0.00032088160514831543, 0.0003315545618534088, 0.0003422275185585022, 0.0003529004752635956, 0.00036357343196868896, 0.00037424638867378235, 0.00038491934537887573, 0.0003955923020839691, 0.0004062652587890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 10.0, 15.0, 12.0, 29.0, 26.0, 43.0, 54.0, 99.0, 153.0, 256.0, 453.0, 944.0, 2116.0, 6334.0, 26309.0, 160875.0, 725179.0, 99818.0, 17563.0, 4734.0, 1693.0, 806.0, 391.0, 212.0, 133.0, 97.0, 45.0, 36.0, 26.0, 27.0, 11.0, 11.0, 8.0, 8.0, 6.0, 7.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.82080078125, -0.7946395874023438, -0.7684783935546875, -0.7423171997070312, -0.716156005859375, -0.6899948120117188, -0.6638336181640625, -0.6376724243164062, -0.61151123046875, -0.5853500366210938, -0.5591888427734375, -0.5330276489257812, -0.506866455078125, -0.48070526123046875, -0.4545440673828125, -0.42838287353515625, -0.4022216796875, -0.37606048583984375, -0.3498992919921875, -0.32373809814453125, -0.297576904296875, -0.27141571044921875, -0.2452545166015625, -0.21909332275390625, -0.19293212890625, -0.16677093505859375, -0.1406097412109375, -0.11444854736328125, -0.088287353515625, -0.06212615966796875, -0.0359649658203125, -0.00980377197265625, 0.016357421875, 0.04251861572265625, 0.0686798095703125, 0.09484100341796875, 0.121002197265625, 0.14716339111328125, 0.1733245849609375, 0.19948577880859375, 0.22564697265625, 0.25180816650390625, 0.2779693603515625, 0.30413055419921875, 0.330291748046875, 0.35645294189453125, 0.3826141357421875, 0.40877532958984375, 0.4349365234375, 0.46109771728515625, 0.4872589111328125, 0.5134201049804688, 0.539581298828125, 0.5657424926757812, 0.5919036865234375, 0.6180648803710938, 0.64422607421875, 0.6703872680664062, 0.6965484619140625, 0.7227096557617188, 0.748870849609375, 0.7750320434570312, 0.8011932373046875, 0.8273544311523438, 0.853515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 6.0, 5.0, 8.0, 15.0, 7.0, 20.0, 19.0, 22.0, 16.0, 37.0, 55.0, 51.0, 60.0, 71.0, 54.0, 74.0, 59.0, 63.0, 74.0, 57.0, 42.0, 34.0, 36.0, 19.0, 21.0, 16.0, 9.0, 11.0, 10.0, 4.0, 7.0, 7.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59130859375, -0.5698623657226562, -0.5484161376953125, -0.5269699096679688, -0.505523681640625, -0.48407745361328125, -0.4626312255859375, -0.44118499755859375, -0.41973876953125, -0.39829254150390625, -0.3768463134765625, -0.35540008544921875, -0.333953857421875, -0.31250762939453125, -0.2910614013671875, -0.26961517333984375, -0.2481689453125, -0.22672271728515625, -0.2052764892578125, -0.18383026123046875, -0.162384033203125, -0.14093780517578125, -0.1194915771484375, -0.09804534912109375, -0.07659912109375, -0.05515289306640625, -0.0337066650390625, -0.01226043701171875, 0.009185791015625, 0.03063201904296875, 0.0520782470703125, 0.07352447509765625, 0.094970703125, 0.11641693115234375, 0.1378631591796875, 0.15930938720703125, 0.180755615234375, 0.20220184326171875, 0.2236480712890625, 0.24509429931640625, 0.26654052734375, 0.28798675537109375, 0.3094329833984375, 0.33087921142578125, 0.352325439453125, 0.37377166748046875, 0.3952178955078125, 0.41666412353515625, 0.4381103515625, 0.45955657958984375, 0.4810028076171875, 0.5024490356445312, 0.523895263671875, 0.5453414916992188, 0.5667877197265625, 0.5882339477539062, 0.60968017578125, 0.6311264038085938, 0.6525726318359375, 0.6740188598632812, 0.695465087890625, 0.7169113159179688, 0.7383575439453125, 0.7598037719726562, 0.78125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 16.0, 18.0, 56.0, 117.0, 362.0, 223.0, 101.0, 50.0, 19.0, 16.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.81583786010742, -43.74491882324219, -42.67399597167969, -41.60307693481445, -40.53215789794922, -39.46123504638672, -38.390316009521484, -37.31939697265625, -36.24847412109375, -35.177555084228516, -34.106632232666016, -33.03571319580078, -31.964794158935547, -30.89387321472168, -29.822952270507812, -28.752033233642578, -27.681114196777344, -26.610193252563477, -25.539274215698242, -24.468353271484375, -23.39743423461914, -22.326513290405273, -21.255592346191406, -20.184673309326172, -19.113752365112305, -18.042831420898438, -16.971912384033203, -15.900991439819336, -14.830071449279785, -13.759151458740234, -12.688230514526367, -11.617310523986816, -10.546388626098633, -9.475468635559082, -8.404548645019531, -7.333627700805664, -6.262707710266113, -5.1917877197265625, -4.1208672523498535, -3.0499467849731445, -1.9790267944335938, -0.9081065654754639, 0.16281366348266602, 1.233733892440796, 2.304654121398926, 3.3755741119384766, 4.4464945793151855, 5.5174150466918945, 6.588335037231445, 7.659255027770996, 8.730175018310547, 9.801095962524414, 10.872015953063965, 11.942935943603516, 13.013856887817383, 14.084776878356934, 15.155696868896484, 16.22661781311035, 17.297536849975586, 18.368457794189453, 19.439376831054688, 20.510297775268555, 21.581218719482422, 22.652137756347656, 23.723058700561523]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 5.0, 0.0, 6.0, 6.0, 6.0, 8.0, 7.0, 8.0, 10.0, 9.0, 16.0, 12.0, 26.0, 21.0, 29.0, 23.0, 27.0, 27.0, 36.0, 97.0, 178.0, 86.0, 44.0, 30.0, 36.0, 17.0, 38.0, 24.0, 19.0, 25.0, 21.0, 19.0, 13.0, 11.0, 10.0, 11.0, 9.0, 5.0, 10.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-18.386028289794922, -17.867717742919922, -17.349407196044922, -16.831098556518555, -16.312788009643555, -15.794477462768555, -15.276167869567871, -14.757858276367188, -14.239547729492188, -13.721237182617188, -13.202927589416504, -12.68461799621582, -12.16630744934082, -11.64799690246582, -11.129687309265137, -10.611377716064453, -10.093067169189453, -9.574756622314453, -9.05644702911377, -8.538137435913086, -8.019826889038086, -7.501516819000244, -6.983206748962402, -6.4648966789245605, -5.946586608886719, -5.428276538848877, -4.909966468811035, -4.391656398773193, -3.8733463287353516, -3.3550362586975098, -2.836726188659668, -2.318416118621826, -1.8001060485839844, -1.2817959785461426, -0.7634859085083008, -0.24517583847045898, 0.2731342315673828, 0.7914443016052246, 1.3097543716430664, 1.8280644416809082, 2.34637451171875, 2.864684581756592, 3.3829946517944336, 3.9013047218322754, 4.419614791870117, 4.937924861907959, 5.456234931945801, 5.974545001983643, 6.492855072021484, 7.011165142059326, 7.529475212097168, 8.047784805297852, 8.566095352172852, 9.084405899047852, 9.602715492248535, 10.121025085449219, 10.639335632324219, 11.157646179199219, 11.675955772399902, 12.194265365600586, 12.712575912475586, 13.230886459350586, 13.74919605255127, 14.267505645751953, 14.785816192626953]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 13.0, 16.0, 20.0, 25.0, 53.0, 55.0, 111.0, 176.0, 240.0, 347.0, 545.0, 890.0, 1519.0, 2787.0, 5194.0, 11384.0, 29011.0, 88355.0, 283939.0, 835597.0, 1530565.0, 927123.0, 321501.0, 97700.0, 32116.0, 12242.0, 5642.0, 2848.0, 1609.0, 939.0, 605.0, 379.0, 234.0, 145.0, 118.0, 75.0, 36.0, 42.0, 26.0, 15.0, 4.0, 9.0, 10.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1953125, -1.15618896484375, -1.1170654296875, -1.07794189453125, -1.038818359375, -0.99969482421875, -0.9605712890625, -0.92144775390625, -0.88232421875, -0.84320068359375, -0.8040771484375, -0.76495361328125, -0.725830078125, -0.68670654296875, -0.6475830078125, -0.60845947265625, -0.5693359375, -0.53021240234375, -0.4910888671875, -0.45196533203125, -0.412841796875, -0.37371826171875, -0.3345947265625, -0.29547119140625, -0.25634765625, -0.21722412109375, -0.1781005859375, -0.13897705078125, -0.099853515625, -0.06072998046875, -0.0216064453125, 0.01751708984375, 0.056640625, 0.09576416015625, 0.1348876953125, 0.17401123046875, 0.213134765625, 0.25225830078125, 0.2913818359375, 0.33050537109375, 0.36962890625, 0.40875244140625, 0.4478759765625, 0.48699951171875, 0.526123046875, 0.56524658203125, 0.6043701171875, 0.64349365234375, 0.6826171875, 0.72174072265625, 0.7608642578125, 0.79998779296875, 0.839111328125, 0.87823486328125, 0.9173583984375, 0.95648193359375, 0.99560546875, 1.03472900390625, 1.0738525390625, 1.11297607421875, 1.152099609375, 1.19122314453125, 1.2303466796875, 1.26947021484375, 1.30859375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 7.0, 6.0, 16.0, 11.0, 10.0, 13.0, 18.0, 21.0, 18.0, 21.0, 48.0, 37.0, 35.0, 46.0, 49.0, 60.0, 59.0, 43.0, 52.0, 44.0, 40.0, 30.0, 24.0, 34.0, 37.0, 36.0, 17.0, 31.0, 26.0, 12.0, 21.0, 15.0, 9.0, 11.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0224609375, -0.9902801513671875, -0.958099365234375, -0.9259185791015625, -0.89373779296875, -0.8615570068359375, -0.829376220703125, -0.7971954345703125, -0.7650146484375, -0.7328338623046875, -0.700653076171875, -0.6684722900390625, -0.63629150390625, -0.6041107177734375, -0.571929931640625, -0.5397491455078125, -0.507568359375, -0.4753875732421875, -0.443206787109375, -0.4110260009765625, -0.37884521484375, -0.3466644287109375, -0.314483642578125, -0.2823028564453125, -0.2501220703125, -0.2179412841796875, -0.185760498046875, -0.1535797119140625, -0.12139892578125, -0.0892181396484375, -0.057037353515625, -0.0248565673828125, 0.00732421875, 0.0395050048828125, 0.071685791015625, 0.1038665771484375, 0.13604736328125, 0.1682281494140625, 0.200408935546875, 0.2325897216796875, 0.2647705078125, 0.2969512939453125, 0.329132080078125, 0.3613128662109375, 0.39349365234375, 0.4256744384765625, 0.457855224609375, 0.4900360107421875, 0.522216796875, 0.5543975830078125, 0.586578369140625, 0.6187591552734375, 0.65093994140625, 0.6831207275390625, 0.715301513671875, 0.7474822998046875, 0.7796630859375, 0.8118438720703125, 0.844024658203125, 0.8762054443359375, 0.90838623046875, 0.9405670166015625, 0.972747802734375, 1.0049285888671875, 1.037109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 4.0, 5.0, 6.0, 22.0, 24.0, 52.0, 67.0, 121.0, 256.0, 483.0, 1132.0, 3280.0, 23887.0, 3600322.0, 551327.0, 9640.0, 2082.0, 766.0, 367.0, 178.0, 96.0, 67.0, 34.0, 21.0, 13.0, 9.0, 10.0, 2.0, 9.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.3160400390625, -6.089111328125, -5.8621826171875, -5.63525390625, -5.4083251953125, -5.181396484375, -4.9544677734375, -4.7275390625, -4.5006103515625, -4.273681640625, -4.0467529296875, -3.81982421875, -3.5928955078125, -3.365966796875, -3.1390380859375, -2.912109375, -2.6851806640625, -2.458251953125, -2.2313232421875, -2.00439453125, -1.7774658203125, -1.550537109375, -1.3236083984375, -1.0966796875, -0.8697509765625, -0.642822265625, -0.4158935546875, -0.18896484375, 0.0379638671875, 0.264892578125, 0.4918212890625, 0.71875, 0.9456787109375, 1.172607421875, 1.3995361328125, 1.62646484375, 1.8533935546875, 2.080322265625, 2.3072509765625, 2.5341796875, 2.7611083984375, 2.988037109375, 3.2149658203125, 3.44189453125, 3.6688232421875, 3.895751953125, 4.1226806640625, 4.349609375, 4.5765380859375, 4.803466796875, 5.0303955078125, 5.25732421875, 5.4842529296875, 5.711181640625, 5.9381103515625, 6.1650390625, 6.3919677734375, 6.618896484375, 6.8458251953125, 7.07275390625, 7.2996826171875, 7.526611328125, 7.7535400390625, 7.98046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 6.0, 3.0, 10.0, 13.0, 19.0, 39.0, 42.0, 85.0, 122.0, 148.0, 242.0, 352.0, 501.0, 656.0, 622.0, 408.0, 310.0, 176.0, 117.0, 72.0, 50.0, 27.0, 16.0, 8.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.046875, -4.916473388671875, -4.78607177734375, -4.655670166015625, -4.5252685546875, -4.394866943359375, -4.26446533203125, -4.134063720703125, -4.003662109375, -3.873260498046875, -3.74285888671875, -3.612457275390625, -3.4820556640625, -3.351654052734375, -3.22125244140625, -3.090850830078125, -2.96044921875, -2.830047607421875, -2.69964599609375, -2.569244384765625, -2.4388427734375, -2.308441162109375, -2.17803955078125, -2.047637939453125, -1.917236328125, -1.786834716796875, -1.65643310546875, -1.526031494140625, -1.3956298828125, -1.265228271484375, -1.13482666015625, -1.004425048828125, -0.8740234375, -0.743621826171875, -0.61322021484375, -0.482818603515625, -0.3524169921875, -0.222015380859375, -0.09161376953125, 0.038787841796875, 0.169189453125, 0.299591064453125, 0.42999267578125, 0.560394287109375, 0.6907958984375, 0.821197509765625, 0.95159912109375, 1.082000732421875, 1.21240234375, 1.342803955078125, 1.47320556640625, 1.603607177734375, 1.7340087890625, 1.864410400390625, 1.99481201171875, 2.125213623046875, 2.255615234375, 2.386016845703125, 2.51641845703125, 2.646820068359375, 2.7772216796875, 2.907623291015625, 3.03802490234375, 3.168426513671875, 3.298828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 11.0, 13.0, 30.0, 66.0, 115.0, 216.0, 230.0, 144.0, 82.0, 39.0, 20.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-76.03483581542969, -74.31876373291016, -72.6026840209961, -70.88661193847656, -69.17053985595703, -67.45446014404297, -65.73838806152344, -64.0223159790039, -62.30624008178711, -60.59016418457031, -58.87409210205078, -57.158016204833984, -55.44194030761719, -53.725868225097656, -52.00979232788086, -50.29371643066406, -48.57764434814453, -46.861568450927734, -45.1454963684082, -43.429420471191406, -41.71334457397461, -39.99727249145508, -38.28119659423828, -36.56512451171875, -34.84904479980469, -33.13296890258789, -31.416894912719727, -29.700820922851562, -27.9847469329834, -26.268672943115234, -24.552597045898438, -22.836523056030273, -21.12044906616211, -19.404375076293945, -17.68829917907715, -15.972225189208984, -14.25615119934082, -12.54007625579834, -10.82400131225586, -9.107927322387695, -7.391852378845215, -5.675777912139893, -3.959703207015991, -2.24362850189209, -0.5275540351867676, 1.1885204315185547, 2.904595375061035, 4.620669364929199, 6.33674430847168, 8.05281925201416, 9.768893241882324, 11.484968185424805, 13.201042175292969, 14.91711711883545, 16.63319206237793, 18.349266052246094, 20.06534194946289, 21.781415939331055, 23.49749183654785, 25.213565826416016, 26.92963981628418, 28.645713806152344, 30.36178970336914, 32.07786560058594, 33.79393768310547]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 5.0, 2.0, 7.0, 3.0, 10.0, 7.0, 11.0, 10.0, 15.0, 16.0, 31.0, 33.0, 25.0, 35.0, 26.0, 38.0, 45.0, 63.0, 61.0, 59.0, 52.0, 54.0, 52.0, 52.0, 49.0, 36.0, 31.0, 42.0, 25.0, 20.0, 24.0, 14.0, 12.0, 10.0, 9.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.1195068359375, -21.467880249023438, -20.816253662109375, -20.164628982543945, -19.513002395629883, -18.86137580871582, -18.20975112915039, -17.558124542236328, -16.906497955322266, -16.254871368408203, -15.603245735168457, -14.951620101928711, -14.299993515014648, -13.648366928100586, -12.99674129486084, -12.345115661621094, -11.693489074707031, -11.041862487792969, -10.390236854553223, -9.738611221313477, -9.086984634399414, -8.435358047485352, -7.7837324142456055, -7.132106304168701, -6.480480194091797, -5.828854084014893, -5.177227973937988, -4.525601863861084, -3.8739757537841797, -3.2223496437072754, -2.570723533630371, -1.9190974235534668, -1.2674713134765625, -0.6158452033996582, 0.035780906677246094, 0.6874070167541504, 1.3390331268310547, 1.990659236907959, 2.6422853469848633, 3.2939114570617676, 3.945537567138672, 4.597163677215576, 5.2487897872924805, 5.900415897369385, 6.552042007446289, 7.203668117523193, 7.855294227600098, 8.506919860839844, 9.158546447753906, 9.810173034667969, 10.461798667907715, 11.113424301147461, 11.765050888061523, 12.416677474975586, 13.068303108215332, 13.719928741455078, 14.37155532836914, 15.023181915283203, 15.67480754852295, 16.326433181762695, 16.978059768676758, 17.62968635559082, 18.28131103515625, 18.932937622070312, 19.584564208984375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 9.0, 1.0, 7.0, 16.0, 30.0, 33.0, 49.0, 77.0, 111.0, 215.0, 340.0, 584.0, 970.0, 1694.0, 3114.0, 5913.0, 12459.0, 28790.0, 74236.0, 239478.0, 474323.0, 124469.0, 45085.0, 18604.0, 8444.0, 4085.0, 2311.0, 1235.0, 740.0, 429.0, 258.0, 153.0, 114.0, 66.0, 34.0, 28.0, 19.0, 17.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.22265625, -2.1595916748046875, -2.096527099609375, -2.0334625244140625, -1.97039794921875, -1.9073333740234375, -1.844268798828125, -1.7812042236328125, -1.7181396484375, -1.6550750732421875, -1.592010498046875, -1.5289459228515625, -1.46588134765625, -1.4028167724609375, -1.339752197265625, -1.2766876220703125, -1.213623046875, -1.1505584716796875, -1.087493896484375, -1.0244293212890625, -0.96136474609375, -0.8983001708984375, -0.835235595703125, -0.7721710205078125, -0.7091064453125, -0.6460418701171875, -0.582977294921875, -0.5199127197265625, -0.45684814453125, -0.3937835693359375, -0.330718994140625, -0.2676544189453125, -0.20458984375, -0.1415252685546875, -0.078460693359375, -0.0153961181640625, 0.04766845703125, 0.1107330322265625, 0.173797607421875, 0.2368621826171875, 0.2999267578125, 0.3629913330078125, 0.426055908203125, 0.4891204833984375, 0.55218505859375, 0.6152496337890625, 0.678314208984375, 0.7413787841796875, 0.804443359375, 0.8675079345703125, 0.930572509765625, 0.9936370849609375, 1.05670166015625, 1.1197662353515625, 1.182830810546875, 1.2458953857421875, 1.3089599609375, 1.3720245361328125, 1.435089111328125, 1.4981536865234375, 1.56121826171875, 1.6242828369140625, 1.687347412109375, 1.7504119873046875, 1.8134765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 11.0, 5.0, 6.0, 9.0, 15.0, 19.0, 5.0, 19.0, 21.0, 27.0, 23.0, 26.0, 31.0, 39.0, 38.0, 58.0, 38.0, 54.0, 51.0, 48.0, 50.0, 48.0, 45.0, 44.0, 37.0, 34.0, 33.0, 33.0, 27.0, 13.0, 17.0, 12.0, 8.0, 15.0, 10.0, 7.0, 5.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3623046875, -1.3222808837890625, -1.282257080078125, -1.2422332763671875, -1.20220947265625, -1.1621856689453125, -1.122161865234375, -1.0821380615234375, -1.0421142578125, -1.0020904541015625, -0.962066650390625, -0.9220428466796875, -0.88201904296875, -0.8419952392578125, -0.801971435546875, -0.7619476318359375, -0.721923828125, -0.6819000244140625, -0.641876220703125, -0.6018524169921875, -0.56182861328125, -0.5218048095703125, -0.481781005859375, -0.4417572021484375, -0.4017333984375, -0.3617095947265625, -0.321685791015625, -0.2816619873046875, -0.24163818359375, -0.2016143798828125, -0.161590576171875, -0.1215667724609375, -0.08154296875, -0.0415191650390625, -0.001495361328125, 0.0385284423828125, 0.07855224609375, 0.1185760498046875, 0.158599853515625, 0.1986236572265625, 0.2386474609375, 0.2786712646484375, 0.318695068359375, 0.3587188720703125, 0.39874267578125, 0.4387664794921875, 0.478790283203125, 0.5188140869140625, 0.558837890625, 0.5988616943359375, 0.638885498046875, 0.6789093017578125, 0.71893310546875, 0.7589569091796875, 0.798980712890625, 0.8390045166015625, 0.8790283203125, 0.9190521240234375, 0.959075927734375, 0.9990997314453125, 1.03912353515625, 1.0791473388671875, 1.119171142578125, 1.1591949462890625, 1.19921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 11.0, 23.0, 18.0, 12.0, 21.0, 45.0, 63.0, 94.0, 135.0, 253.0, 394.0, 774.0, 1854.0, 5520.0, 26653.0, 593985.0, 383695.0, 25842.0, 5566.0, 1860.0, 714.0, 374.0, 240.0, 119.0, 68.0, 57.0, 48.0, 31.0, 17.0, 18.0, 9.0, 6.0, 4.0, 2.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.884765625, -3.76702880859375, -3.6492919921875, -3.53155517578125, -3.413818359375, -3.29608154296875, -3.1783447265625, -3.06060791015625, -2.94287109375, -2.82513427734375, -2.7073974609375, -2.58966064453125, -2.471923828125, -2.35418701171875, -2.2364501953125, -2.11871337890625, -2.0009765625, -1.88323974609375, -1.7655029296875, -1.64776611328125, -1.530029296875, -1.41229248046875, -1.2945556640625, -1.17681884765625, -1.05908203125, -0.94134521484375, -0.8236083984375, -0.70587158203125, -0.588134765625, -0.47039794921875, -0.3526611328125, -0.23492431640625, -0.1171875, 0.00054931640625, 0.1182861328125, 0.23602294921875, 0.353759765625, 0.47149658203125, 0.5892333984375, 0.70697021484375, 0.82470703125, 0.94244384765625, 1.0601806640625, 1.17791748046875, 1.295654296875, 1.41339111328125, 1.5311279296875, 1.64886474609375, 1.7666015625, 1.88433837890625, 2.0020751953125, 2.11981201171875, 2.237548828125, 2.35528564453125, 2.4730224609375, 2.59075927734375, 2.70849609375, 2.82623291015625, 2.9439697265625, 3.06170654296875, 3.179443359375, 3.29718017578125, 3.4149169921875, 3.53265380859375, 3.650390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 4.0, 9.0, 8.0, 10.0, 10.0, 13.0, 19.0, 20.0, 26.0, 28.0, 37.0, 29.0, 58.0, 56.0, 74.0, 86.0, 77.0, 74.0, 68.0, 56.0, 37.0, 34.0, 22.0, 20.0, 25.0, 11.0, 11.0, 9.0, 17.0, 13.0, 6.0, 6.0, 9.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6796875, -5.5029296875, -5.326171875, -5.1494140625, -4.97265625, -4.7958984375, -4.619140625, -4.4423828125, -4.265625, -4.0888671875, -3.912109375, -3.7353515625, -3.55859375, -3.3818359375, -3.205078125, -3.0283203125, -2.8515625, -2.6748046875, -2.498046875, -2.3212890625, -2.14453125, -1.9677734375, -1.791015625, -1.6142578125, -1.4375, -1.2607421875, -1.083984375, -0.9072265625, -0.73046875, -0.5537109375, -0.376953125, -0.2001953125, -0.0234375, 0.1533203125, 0.330078125, 0.5068359375, 0.68359375, 0.8603515625, 1.037109375, 1.2138671875, 1.390625, 1.5673828125, 1.744140625, 1.9208984375, 2.09765625, 2.2744140625, 2.451171875, 2.6279296875, 2.8046875, 2.9814453125, 3.158203125, 3.3349609375, 3.51171875, 3.6884765625, 3.865234375, 4.0419921875, 4.21875, 4.3955078125, 4.572265625, 4.7490234375, 4.92578125, 5.1025390625, 5.279296875, 5.4560546875, 5.6328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 6.0, 6.0, 7.0, 11.0, 11.0, 12.0, 30.0, 29.0, 31.0, 58.0, 86.0, 128.0, 215.0, 428.0, 864.0, 1871.0, 4669.0, 13846.0, 59549.0, 841393.0, 96217.0, 18551.0, 5956.0, 2352.0, 1046.0, 508.0, 239.0, 139.0, 87.0, 51.0, 39.0, 32.0, 20.0, 14.0, 21.0, 18.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.79150390625, -0.7698898315429688, -0.7482757568359375, -0.7266616821289062, -0.705047607421875, -0.6834335327148438, -0.6618194580078125, -0.6402053833007812, -0.61859130859375, -0.5969772338867188, -0.5753631591796875, -0.5537490844726562, -0.532135009765625, -0.5105209350585938, -0.4889068603515625, -0.46729278564453125, -0.4456787109375, -0.42406463623046875, -0.4024505615234375, -0.38083648681640625, -0.359222412109375, -0.33760833740234375, -0.3159942626953125, -0.29438018798828125, -0.27276611328125, -0.25115203857421875, -0.2295379638671875, -0.20792388916015625, -0.186309814453125, -0.16469573974609375, -0.1430816650390625, -0.12146759033203125, -0.099853515625, -0.07823944091796875, -0.0566253662109375, -0.03501129150390625, -0.013397216796875, 0.00821685791015625, 0.0298309326171875, 0.05144500732421875, 0.07305908203125, 0.09467315673828125, 0.1162872314453125, 0.13790130615234375, 0.159515380859375, 0.18112945556640625, 0.2027435302734375, 0.22435760498046875, 0.2459716796875, 0.26758575439453125, 0.2891998291015625, 0.31081390380859375, 0.332427978515625, 0.35404205322265625, 0.3756561279296875, 0.39727020263671875, 0.41888427734375, 0.44049835205078125, 0.4621124267578125, 0.48372650146484375, 0.505340576171875, 0.5269546508789062, 0.5485687255859375, 0.5701828002929688, 0.591796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 3.0, 5.0, 11.0, 9.0, 18.0, 13.0, 15.0, 27.0, 31.0, 34.0, 47.0, 73.0, 120.0, 120.0, 110.0, 94.0, 69.0, 28.0, 43.0, 26.0, 27.0, 12.0, 7.0, 9.0, 11.0, 7.0, 11.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002486705780029297, -0.00024131685495376587, -0.00023396313190460205, -0.00022660940885543823, -0.00021925568580627441, -0.0002119019627571106, -0.00020454823970794678, -0.00019719451665878296, -0.00018984079360961914, -0.00018248707056045532, -0.0001751333475112915, -0.00016777962446212769, -0.00016042590141296387, -0.00015307217836380005, -0.00014571845531463623, -0.0001383647322654724, -0.0001310110092163086, -0.00012365728616714478, -0.00011630356311798096, -0.00010894984006881714, -0.00010159611701965332, -9.42423939704895e-05, -8.688867092132568e-05, -7.953494787216187e-05, -7.218122482299805e-05, -6.482750177383423e-05, -5.747377872467041e-05, -5.012005567550659e-05, -4.2766332626342773e-05, -3.5412609577178955e-05, -2.8058886528015137e-05, -2.070516347885132e-05, -1.33514404296875e-05, -5.997717380523682e-06, 1.3560056686401367e-06, 8.709728717803955e-06, 1.6063451766967773e-05, 2.3417174816131592e-05, 3.077089786529541e-05, 3.812462091445923e-05, 4.547834396362305e-05, 5.2832067012786865e-05, 6.0185790061950684e-05, 6.75395131111145e-05, 7.489323616027832e-05, 8.224695920944214e-05, 8.960068225860596e-05, 9.695440530776978e-05, 0.0001043081283569336, 0.00011166185140609741, 0.00011901557445526123, 0.00012636929750442505, 0.00013372302055358887, 0.00014107674360275269, 0.0001484304666519165, 0.00015578418970108032, 0.00016313791275024414, 0.00017049163579940796, 0.00017784535884857178, 0.0001851990818977356, 0.00019255280494689941, 0.00019990652799606323, 0.00020726025104522705, 0.00021461397409439087, 0.0002219676971435547]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 6.0, 12.0, 11.0, 15.0, 35.0, 35.0, 67.0, 85.0, 131.0, 241.0, 420.0, 795.0, 1702.0, 3906.0, 10603.0, 36027.0, 242603.0, 692884.0, 39414.0, 11563.0, 4323.0, 1700.0, 887.0, 411.0, 240.0, 138.0, 97.0, 54.0, 42.0, 32.0, 16.0, 14.0, 8.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5478515625, -0.5322151184082031, -0.5165786743164062, -0.5009422302246094, -0.4853057861328125, -0.4696693420410156, -0.45403289794921875, -0.4383964538574219, -0.422760009765625, -0.4071235656738281, -0.39148712158203125, -0.3758506774902344, -0.3602142333984375, -0.3445777893066406, -0.32894134521484375, -0.3133049011230469, -0.29766845703125, -0.2820320129394531, -0.26639556884765625, -0.2507591247558594, -0.2351226806640625, -0.21948623657226562, -0.20384979248046875, -0.18821334838867188, -0.172576904296875, -0.15694046020507812, -0.14130401611328125, -0.12566757202148438, -0.1100311279296875, -0.09439468383789062, -0.07875823974609375, -0.06312179565429688, -0.0474853515625, -0.031848907470703125, -0.01621246337890625, -0.000576019287109375, 0.0150604248046875, 0.030696868896484375, 0.04633331298828125, 0.061969757080078125, 0.077606201171875, 0.09324264526367188, 0.10887908935546875, 0.12451553344726562, 0.1401519775390625, 0.15578842163085938, 0.17142486572265625, 0.18706130981445312, 0.20269775390625, 0.21833419799804688, 0.23397064208984375, 0.24960708618164062, 0.2652435302734375, 0.2808799743652344, 0.29651641845703125, 0.3121528625488281, 0.327789306640625, 0.3434257507324219, 0.35906219482421875, 0.3746986389160156, 0.3903350830078125, 0.4059715270996094, 0.42160797119140625, 0.4372444152832031, 0.452880859375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 3.0, 1.0, 10.0, 9.0, 16.0, 14.0, 17.0, 33.0, 30.0, 31.0, 56.0, 82.0, 97.0, 116.0, 100.0, 97.0, 71.0, 43.0, 39.0, 29.0, 15.0, 17.0, 17.0, 6.0, 8.0, 5.0, 9.0, 1.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.72705078125, -0.7056045532226562, -0.6841583251953125, -0.6627120971679688, -0.641265869140625, -0.6198196411132812, -0.5983734130859375, -0.5769271850585938, -0.55548095703125, -0.5340347290039062, -0.5125885009765625, -0.49114227294921875, -0.469696044921875, -0.44824981689453125, -0.4268035888671875, -0.40535736083984375, -0.3839111328125, -0.36246490478515625, -0.3410186767578125, -0.31957244873046875, -0.298126220703125, -0.27667999267578125, -0.2552337646484375, -0.23378753662109375, -0.21234130859375, -0.19089508056640625, -0.1694488525390625, -0.14800262451171875, -0.126556396484375, -0.10511016845703125, -0.0836639404296875, -0.06221771240234375, -0.040771484375, -0.01932525634765625, 0.0021209716796875, 0.02356719970703125, 0.045013427734375, 0.06645965576171875, 0.0879058837890625, 0.10935211181640625, 0.13079833984375, 0.15224456787109375, 0.1736907958984375, 0.19513702392578125, 0.216583251953125, 0.23802947998046875, 0.2594757080078125, 0.28092193603515625, 0.3023681640625, 0.32381439208984375, 0.3452606201171875, 0.36670684814453125, 0.388153076171875, 0.40959930419921875, 0.4310455322265625, 0.45249176025390625, 0.47393798828125, 0.49538421630859375, 0.5168304443359375, 0.5382766723632812, 0.559722900390625, 0.5811691284179688, 0.6026153564453125, 0.6240615844726562, 0.6455078125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 15.0, 32.0, 66.0, 87.0, 510.0, 127.0, 67.0, 42.0, 22.0, 11.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.34033966064453, -40.39403533935547, -39.44772720336914, -38.50142288208008, -37.555118560791016, -36.60881042480469, -35.662506103515625, -34.71620178222656, -33.769893646240234, -32.82358932495117, -31.877283096313477, -30.93097686767578, -29.984670639038086, -29.03836441040039, -28.092060089111328, -27.145753860473633, -26.19944953918457, -25.253143310546875, -24.306838989257812, -23.360532760620117, -22.414226531982422, -21.46792221069336, -20.521615982055664, -19.57530975341797, -18.629005432128906, -17.68269920349121, -16.73639488220215, -15.790088653564453, -14.843782424926758, -13.897477149963379, -12.951171875, -12.004865646362305, -11.05855941772461, -10.11225414276123, -9.165947914123535, -8.219642639160156, -7.273336887359619, -6.327031135559082, -5.380725860595703, -4.434420108795166, -3.488114356994629, -2.541808605194092, -1.5955030918121338, -0.6491975784301758, 0.29710817337036133, 1.2434139251708984, 2.1897192001342773, 3.1360249519348145, 4.082330703735352, 5.028636455535889, 5.974942207336426, 6.921247482299805, 7.867553234100342, 8.813858985900879, 9.760164260864258, 10.706470489501953, 11.652775764465332, 12.599081039428711, 13.545387268066406, 14.491692543029785, 15.437997817993164, 16.38430404663086, 17.330608367919922, 18.276914596557617, 19.223220825195312]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 6.0, 2.0, 3.0, 6.0, 5.0, 12.0, 15.0, 9.0, 18.0, 8.0, 18.0, 18.0, 27.0, 42.0, 28.0, 32.0, 94.0, 325.0, 100.0, 37.0, 29.0, 20.0, 17.0, 16.0, 20.0, 17.0, 10.0, 18.0, 11.0, 9.0, 10.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-18.823379516601562, -18.32134246826172, -17.819303512573242, -17.3172664642334, -16.815227508544922, -16.313190460205078, -15.811152458190918, -15.309114456176758, -14.807076454162598, -14.305038452148438, -13.803000450134277, -13.300962448120117, -12.798925399780273, -12.296886444091797, -11.794849395751953, -11.292811393737793, -10.790773391723633, -10.288735389709473, -9.786697387695312, -9.284659385681152, -8.782621383666992, -8.280584335327148, -7.778546333312988, -7.276508331298828, -6.774470329284668, -6.272432327270508, -5.770394325256348, -5.268356800079346, -4.7663187980651855, -4.264280796051025, -3.7622430324554443, -3.2602052688598633, -2.7581663131713867, -2.2561283111572266, -1.7540905475616455, -1.252052664756775, -0.7500147819519043, -0.24797677993774414, 0.2540609836578369, 0.756098747253418, 1.2581367492675781, 1.7601746320724487, 2.2622125148773193, 2.7642502784729004, 3.2662882804870605, 3.7683262825012207, 4.270363807678223, 4.772401809692383, 5.274439811706543, 5.776477813720703, 6.278515815734863, 6.780553340911865, 7.282591342926025, 7.7846293449401855, 8.286666870117188, 8.788704872131348, 9.290742874145508, 9.792780876159668, 10.294818878173828, 10.796856880187988, 11.298894882202148, 11.800931930541992, 12.302969932556152, 12.805007934570312, 13.307045936584473]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 8.0, 13.0, 7.0, 10.0, 7.0, 9.0, 6.0, 22.0, 12.0, 14.0, 15.0, 24.0, 20.0, 33.0, 41.0, 38.0, 82.0, 184.0, 108.0, 55.0, 28.0, 32.0, 40.0, 23.0, 24.0, 17.0, 14.0, 18.0, 15.0, 9.0, 10.0, 10.0, 10.0, 6.0, 4.0, 5.0, 7.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9736328125, -0.9417266845703125, -0.909820556640625, -0.8779144287109375, -0.84600830078125, -0.8141021728515625, -0.782196044921875, -0.7502899169921875, -0.7183837890625, -0.6864776611328125, -0.654571533203125, -0.6226654052734375, -0.59075927734375, -0.5588531494140625, -0.526947021484375, -0.4950408935546875, -0.463134765625, -0.4312286376953125, -0.399322509765625, -0.3674163818359375, -0.33551025390625, -0.3036041259765625, -0.271697998046875, -0.2397918701171875, -0.2078857421875, -0.1759796142578125, -0.144073486328125, -0.1121673583984375, -0.08026123046875, -0.0483551025390625, -0.016448974609375, 0.0154571533203125, 0.04736328125, 0.0792694091796875, 0.111175537109375, 0.1430816650390625, 0.17498779296875, 0.2068939208984375, 0.238800048828125, 0.2707061767578125, 0.3026123046875, 0.3345184326171875, 0.366424560546875, 0.3983306884765625, 0.43023681640625, 0.4621429443359375, 0.494049072265625, 0.5259552001953125, 0.557861328125, 0.5897674560546875, 0.621673583984375, 0.6535797119140625, 0.68548583984375, 0.7173919677734375, 0.749298095703125, 0.7812042236328125, 0.8131103515625, 0.8450164794921875, 0.876922607421875, 0.9088287353515625, 0.94073486328125, 0.9726409912109375, 1.004547119140625, 1.0364532470703125, 1.068359375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 5.0, 2.0, 0.0, 7.0, 0.0, 8.0, 4.0, 9.0, 6.0, 4.0, 15.0, 21.0, 23.0, 45.0, 90.0, 156.0, 321.0, 1052.0, 4136.0, 39021.0, 8331728.0, 8890.0, 1930.0, 564.0, 220.0, 108.0, 63.0, 23.0, 26.0, 22.0, 26.0, 2.0, 7.0, 9.0, 6.0, 4.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 5.0, 4.0], "bins": [-13.309447288513184, -12.883353233337402, -12.457258224487305, -12.031164169311523, -11.605069160461426, -11.178975105285645, -10.752880096435547, -10.326786041259766, -9.900691032409668, -9.474596977233887, -9.048501968383789, -8.622407913208008, -8.19631290435791, -7.770218849182129, -7.344123840332031, -6.91802978515625, -6.4919352531433105, -6.065840721130371, -5.639746189117432, -5.213651657104492, -4.787557125091553, -4.361462593078613, -3.935368299484253, -3.5092737674713135, -3.083179235458374, -2.6570847034454346, -2.230990171432495, -1.8048957586288452, -1.3788012266159058, -0.9527068138122559, -0.5266122817993164, -0.10051774978637695, 0.3255767822265625, 0.751671314239502, 1.1777658462524414, 1.6038602590560913, 2.0299549102783203, 2.4560492038726807, 2.88214373588562, 3.3082382678985596, 3.734332799911499, 4.160427093505859, 4.586521625518799, 5.012616157531738, 5.438710689544678, 5.864805221557617, 6.290899753570557, 6.716994285583496, 7.1430888175964355, 7.569183349609375, 7.9952778816223145, 8.421372413635254, 8.847466468811035, 9.273561477661133, 9.699655532836914, 10.125750541687012, 10.551844596862793, 10.977938652038574, 11.404033660888672, 11.830127716064453, 12.25622272491455, 12.682316780090332, 13.10841178894043, 13.534505844116211, 13.960600852966309]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 7.0, 5.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 1.0, 6.0, 4.0, 3.0, 6.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.521769523620605, -11.245092391967773, -10.968414306640625, -10.691737174987793, -10.415060043334961, -10.138382911682129, -9.86170482635498, -9.585027694702148, -9.308350563049316, -9.031673431396484, -8.754995346069336, -8.478318214416504, -8.201641082763672, -7.924963474273682, -7.648285865783691, -7.371608734130859, -7.094931125640869, -6.818253517150879, -6.541576385498047, -6.264898777008057, -5.988221645355225, -5.711544036865234, -5.434866905212402, -5.158189296722412, -4.881511688232422, -4.604834079742432, -4.3281569480896, -4.051479339599609, -3.7748022079467773, -3.498124599456787, -3.221447229385376, -2.944769859313965, -2.6680922508239746, -2.3914148807525635, -2.1147375106811523, -1.8380600214004517, -1.5613826513290405, -1.2847052812576294, -1.0080277919769287, -0.7313504219055176, -0.45467305183410645, -0.17799565196037292, 0.0986817479133606, 0.3753591775894165, 0.6520365476608276, 0.9287139177322388, 1.2053914070129395, 1.4820687770843506, 1.7587461471557617, 2.035423517227173, 2.312100887298584, 2.588778495788574, 2.8654556274414062, 3.1421332359313965, 3.4188106060028076, 3.6954879760742188, 3.97216534614563, 4.248842716217041, 4.525520324707031, 4.802197456359863, 5.0788750648498535, 5.3555521965026855, 5.632229804992676, 5.908906936645508, 6.185584545135498]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 1.0, 7.0, 12.0, 20.0, 20.0, 31.0, 46.0, 55.0, 91.0, 148.0, 253.0, 481.0, 949.0, 2207.0, 5936.0, 16898.0, 51651.0, 158694.0, 189592.0, 64860.0, 20375.0, 7079.0, 2688.0, 991.0, 487.0, 248.0, 144.0, 88.0, 62.0, 40.0, 30.0, 23.0, 10.0, 13.0, 11.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-12.6015625, -12.2525634765625, -11.903564453125, -11.5545654296875, -11.20556640625, -10.8565673828125, -10.507568359375, -10.1585693359375, -9.8095703125, -9.4605712890625, -9.111572265625, -8.7625732421875, -8.41357421875, -8.0645751953125, -7.715576171875, -7.3665771484375, -7.017578125, -6.6685791015625, -6.319580078125, -5.9705810546875, -5.62158203125, -5.2725830078125, -4.923583984375, -4.5745849609375, -4.2255859375, -3.8765869140625, -3.527587890625, -3.1785888671875, -2.82958984375, -2.4805908203125, -2.131591796875, -1.7825927734375, -1.43359375, -1.0845947265625, -0.735595703125, -0.3865966796875, -0.03759765625, 0.3114013671875, 0.660400390625, 1.0093994140625, 1.3583984375, 1.7073974609375, 2.056396484375, 2.4053955078125, 2.75439453125, 3.1033935546875, 3.452392578125, 3.8013916015625, 4.150390625, 4.4993896484375, 4.848388671875, 5.1973876953125, 5.54638671875, 5.8953857421875, 6.244384765625, 6.5933837890625, 6.9423828125, 7.2913818359375, 7.640380859375, 7.9893798828125, 8.33837890625, 8.6873779296875, 9.036376953125, 9.3853759765625, 9.734375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 7.0, 6.0, 10.0, 15.0, 12.0, 15.0, 18.0, 21.0, 33.0, 30.0, 48.0, 53.0, 68.0, 72.0, 71.0, 69.0, 60.0, 56.0, 54.0, 59.0, 32.0, 35.0, 33.0, 29.0, 9.0, 12.0, 17.0, 6.0, 8.0, 7.0, 9.0, 5.0, 1.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.818359375, -1.7715301513671875, -1.724700927734375, -1.6778717041015625, -1.63104248046875, -1.5842132568359375, -1.537384033203125, -1.4905548095703125, -1.4437255859375, -1.3968963623046875, -1.350067138671875, -1.3032379150390625, -1.25640869140625, -1.2095794677734375, -1.162750244140625, -1.1159210205078125, -1.069091796875, -1.0222625732421875, -0.975433349609375, -0.9286041259765625, -0.88177490234375, -0.8349456787109375, -0.788116455078125, -0.7412872314453125, -0.6944580078125, -0.6476287841796875, -0.600799560546875, -0.5539703369140625, -0.50714111328125, -0.4603118896484375, -0.413482666015625, -0.3666534423828125, -0.31982421875, -0.2729949951171875, -0.226165771484375, -0.1793365478515625, -0.13250732421875, -0.0856781005859375, -0.038848876953125, 0.0079803466796875, 0.0548095703125, 0.1016387939453125, 0.148468017578125, 0.1952972412109375, 0.24212646484375, 0.2889556884765625, 0.335784912109375, 0.3826141357421875, 0.429443359375, 0.4762725830078125, 0.523101806640625, 0.5699310302734375, 0.61676025390625, 0.6635894775390625, 0.710418701171875, 0.7572479248046875, 0.8040771484375, 0.8509063720703125, 0.897735595703125, 0.9445648193359375, 0.99139404296875, 1.0382232666015625, 1.085052490234375, 1.1318817138671875, 1.1787109375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 8.0, 2.0, 6.0, 11.0, 13.0, 29.0, 49.0, 83.0, 117.0, 75.0, 39.0, 18.0, 7.0, 6.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.193470001220703, -8.796862602233887, -8.400256156921387, -8.00364875793457, -7.607041835784912, -7.210434913635254, -6.813827991485596, -6.4172210693359375, -6.020613670349121, -5.624006748199463, -5.227399826049805, -4.830792427062988, -4.43418550491333, -4.037578582763672, -3.6409716606140137, -3.2443645000457764, -2.8477578163146973, -2.451150894165039, -2.0545437335968018, -1.6579368114471436, -1.2613297700881958, -0.864722728729248, -0.46811580657958984, -0.07150864601135254, 0.32509827613830566, 0.7217053174972534, 1.1183123588562012, 1.5149192810058594, 1.9115263223648071, 2.308133363723755, 2.704740285873413, 3.1013474464416504, 3.4979543685913086, 3.894561290740967, 4.291168212890625, 4.687775611877441, 5.0843825340271, 5.480989456176758, 5.877596378326416, 6.274203300476074, 6.670810699462891, 7.067417621612549, 7.464024543762207, 7.860631942749023, 8.257238388061523, 8.65384578704834, 9.050453186035156, 9.447059631347656, 9.843666076660156, 10.240273475646973, 10.636879920959473, 11.033487319946289, 11.430093765258789, 11.826701164245605, 12.223308563232422, 12.619915008544922, 13.016522407531738, 13.413129806518555, 13.809736251831055, 14.206343650817871, 14.602950096130371, 14.999557495117188, 15.396163940429688, 15.792771339416504, 16.18937873840332]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 5.0, 11.0, 10.0, 23.0, 47.0, 64.0, 75.0, 73.0, 59.0, 33.0, 20.0, 9.0, 6.0, 7.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.668726921081543, -6.446429252624512, -6.224132061004639, -6.001834392547607, -5.779537200927734, -5.557239532470703, -5.334941864013672, -5.112644195556641, -4.890347003936768, -4.668049335479736, -4.445752143859863, -4.223454475402832, -4.001156806945801, -3.7788596153259277, -3.5565619468688965, -3.3342645168304443, -3.111967086791992, -2.88966965675354, -2.667372226715088, -2.4450745582580566, -2.2227771282196045, -2.0004796981811523, -1.7781821489334106, -1.555884599685669, -1.3335871696472168, -1.1112897396087646, -0.888992190361023, -0.666694700717926, -0.4443972110748291, -0.22209978103637695, 0.0001977682113647461, 0.22249531745910645, 0.4447932243347168, 0.6670907139778137, 0.8893882036209106, 1.1116857528686523, 1.3339831829071045, 1.5562806129455566, 1.7785781621932983, 2.00087571144104, 2.223173141479492, 2.4454705715179443, 2.6677680015563965, 2.8900656700134277, 3.11236310005188, 3.334660530090332, 3.5569581985473633, 3.7792556285858154, 4.001553058624268, 4.223850727081299, 4.446147918701172, 4.668445587158203, 4.890743255615234, 5.113040447235107, 5.335338115692139, 5.557635307312012, 5.779932975769043, 6.002230644226074, 6.224527835845947, 6.4468255043029785, 6.669122695922852, 6.891420364379883, 7.113718032836914, 7.336015701293945, 7.558312892913818]}, "eval/loss": 4.192998886108398, "eval/wer": 1.903669178897263, "eval/runtime": 786.9912, "eval/samples_per_second": 3.357, "eval/steps_per_second": 0.281, "train/train_runtime": 6714.5583, "train/train_samples_per_second": 4.25, "train/train_steps_per_second": 0.177, "train/total_flos": 0.0, "train/train_loss": 4.242165094268132} \ No newline at end of file