diff --git "a/wandb/run-20220303_074415-2c9ds5of/files/wandb-summary.json" "b/wandb/run-20220303_074415-2c9ds5of/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220303_074415-2c9ds5of/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 5.4469, "train/learning_rate": 0.000994, "train/epoch": 0.42, "train/global_step": 500, "_runtime": 2831, "_timestamp": 1646296287, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 168.0, 820.0, 25.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-918.9666748046875, -902.3575439453125, -885.7484130859375, -869.1392211914062, -852.5300903320312, -835.9209594726562, -819.3118286132812, -802.7026977539062, -786.093505859375, -769.484375, -752.875244140625, -736.2660522460938, -719.6569213867188, -703.0477905273438, -686.4386596679688, -669.8295288085938, -653.2203979492188, -636.6112670898438, -620.0021362304688, -603.3929443359375, -586.7838134765625, -570.1746826171875, -553.5655517578125, -536.9564208984375, -520.3472900390625, -503.7381591796875, -487.1289978027344, -470.5198669433594, -453.91070556640625, -437.30157470703125, -420.69244384765625, -404.08331298828125, -387.47418212890625, -370.86505126953125, -354.2558898925781, -337.6467590332031, -321.03759765625, -304.428466796875, -287.8193359375, -271.210205078125, -254.60104370117188, -237.9918975830078, -221.38275146484375, -204.77362060546875, -188.1644744873047, -171.55532836914062, -154.94619750976562, -138.33705139160156, -121.7279052734375, -105.11875915527344, -88.5096206665039, -71.90048217773438, -55.29133605957031, -38.68218994140625, -22.07305145263672, -5.4639129638671875, 11.145233154296875, 27.754375457763672, 44.36351776123047, 60.972660064697266, 77.58180236816406, 94.19094848632812, 110.80008697509766, 127.40922546386719, 144.01837158203125]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 4.0, 9.0, 7.0, 11.0, 6.0, 8.0, 17.0, 19.0, 23.0, 21.0, 27.0, 27.0, 29.0, 38.0, 41.0, 36.0, 46.0, 55.0, 37.0, 38.0, 65.0, 33.0, 40.0, 29.0, 41.0, 30.0, 35.0, 25.0, 29.0, 22.0, 22.0, 19.0, 21.0, 17.0, 20.0, 11.0, 7.0, 8.0, 7.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.76666259765625, -101.8507308959961, -97.93479919433594, -94.01886749267578, -90.10293579101562, -86.18701171875, -82.27108001708984, -78.35514831542969, -74.43921661376953, -70.52328491210938, -66.60735321044922, -62.69142532348633, -58.77549362182617, -54.859561920166016, -50.943634033203125, -47.02770233154297, -43.11177062988281, -39.195838928222656, -35.2799072265625, -31.36397933959961, -27.448047637939453, -23.532115936279297, -19.616186141967773, -15.70025634765625, -11.784324645996094, -7.868393898010254, -3.952463150024414, -0.03653240203857422, 3.8793983459472656, 7.795330047607422, 11.711259841918945, 15.627189636230469, 19.543121337890625, 23.45905303955078, 27.374982833862305, 31.290912628173828, 35.206844329833984, 39.12277603149414, 43.03870391845703, 46.95463562011719, 50.870567321777344, 54.7864990234375, 58.702430725097656, 62.61835861206055, 66.53428649902344, 70.45022583007812, 74.36614990234375, 78.2820816040039, 82.19801330566406, 86.11394500732422, 90.02987670898438, 93.94580841064453, 97.86174011230469, 101.77766418457031, 105.69359588623047, 109.60952758789062, 113.52545928955078, 117.44139099121094, 121.3573226928711, 125.27325439453125, 129.18917846679688, 133.10511779785156, 137.0210418701172, 140.93698120117188, 144.8529052734375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 6.0, 2.0, 7.0, 8.0, 8.0, 14.0, 14.0, 16.0, 17.0, 22.0, 22.0, 33.0, 35.0, 39.0, 39.0, 41.0, 48.0, 38.0, 46.0, 54.0, 55.0, 34.0, 40.0, 32.0, 37.0, 30.0, 27.0, 25.0, 28.0, 27.0, 25.0, 15.0, 22.0, 20.0, 14.0, 12.0, 11.0, 6.0, 5.0, 7.0, 7.0, 2.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-1.6533203125, -1.5970001220703125, -1.540679931640625, -1.4843597412109375, -1.42803955078125, -1.3717193603515625, -1.315399169921875, -1.2590789794921875, -1.2027587890625, -1.1464385986328125, -1.090118408203125, -1.0337982177734375, -0.97747802734375, -0.9211578369140625, -0.864837646484375, -0.8085174560546875, -0.752197265625, -0.6958770751953125, -0.639556884765625, -0.5832366943359375, -0.52691650390625, -0.4705963134765625, -0.414276123046875, -0.3579559326171875, -0.3016357421875, -0.2453155517578125, -0.188995361328125, -0.1326751708984375, -0.07635498046875, -0.0200347900390625, 0.036285400390625, 0.0926055908203125, 0.14892578125, 0.2052459716796875, 0.261566162109375, 0.3178863525390625, 0.37420654296875, 0.4305267333984375, 0.486846923828125, 0.5431671142578125, 0.5994873046875, 0.6558074951171875, 0.712127685546875, 0.7684478759765625, 0.82476806640625, 0.8810882568359375, 0.937408447265625, 0.9937286376953125, 1.050048828125, 1.1063690185546875, 1.162689208984375, 1.2190093994140625, 1.27532958984375, 1.3316497802734375, 1.387969970703125, 1.4442901611328125, 1.5006103515625, 1.5569305419921875, 1.613250732421875, 1.6695709228515625, 1.72589111328125, 1.7822113037109375, 1.838531494140625, 1.8948516845703125, 1.951171875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 11.0, 17.0, 16.0, 14.0, 34.0, 46.0, 48.0, 71.0, 117.0, 158.0, 226.0, 359.0, 501.0, 836.0, 1339.0, 2328.0, 5133.0, 15756.0, 130235.0, 3920517.0, 91580.0, 13951.0, 4766.0, 2216.0, 1331.0, 793.0, 560.0, 366.0, 255.0, 196.0, 143.0, 92.0, 56.0, 50.0, 43.0, 40.0, 20.0, 16.0, 11.0, 8.0, 9.0, 6.0, 4.0, 1.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.2421875, -14.7247314453125, -14.207275390625, -13.6898193359375, -13.17236328125, -12.6549072265625, -12.137451171875, -11.6199951171875, -11.1025390625, -10.5850830078125, -10.067626953125, -9.5501708984375, -9.03271484375, -8.5152587890625, -7.997802734375, -7.4803466796875, -6.962890625, -6.4454345703125, -5.927978515625, -5.4105224609375, -4.89306640625, -4.3756103515625, -3.858154296875, -3.3406982421875, -2.8232421875, -2.3057861328125, -1.788330078125, -1.2708740234375, -0.75341796875, -0.2359619140625, 0.281494140625, 0.7989501953125, 1.31640625, 1.8338623046875, 2.351318359375, 2.8687744140625, 3.38623046875, 3.9036865234375, 4.421142578125, 4.9385986328125, 5.4560546875, 5.9735107421875, 6.490966796875, 7.0084228515625, 7.52587890625, 8.0433349609375, 8.560791015625, 9.0782470703125, 9.595703125, 10.1131591796875, 10.630615234375, 11.1480712890625, 11.66552734375, 12.1829833984375, 12.700439453125, 13.2178955078125, 13.7353515625, 14.2528076171875, 14.770263671875, 15.2877197265625, 15.80517578125, 16.3226318359375, 16.840087890625, 17.3575439453125, 17.875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 12.0, 10.0, 10.0, 17.0, 26.0, 35.0, 52.0, 55.0, 86.0, 125.0, 170.0, 240.0, 410.0, 586.0, 673.0, 513.0, 331.0, 177.0, 120.0, 102.0, 82.0, 55.0, 36.0, 29.0, 19.0, 16.0, 11.0, 13.0, 8.0, 6.0, 11.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.74609375, -6.51556396484375, -6.2850341796875, -6.05450439453125, -5.823974609375, -5.59344482421875, -5.3629150390625, -5.13238525390625, -4.90185546875, -4.67132568359375, -4.4407958984375, -4.21026611328125, -3.979736328125, -3.74920654296875, -3.5186767578125, -3.28814697265625, -3.0576171875, -2.82708740234375, -2.5965576171875, -2.36602783203125, -2.135498046875, -1.90496826171875, -1.6744384765625, -1.44390869140625, -1.21337890625, -0.98284912109375, -0.7523193359375, -0.52178955078125, -0.291259765625, -0.06072998046875, 0.1697998046875, 0.40032958984375, 0.630859375, 0.86138916015625, 1.0919189453125, 1.32244873046875, 1.552978515625, 1.78350830078125, 2.0140380859375, 2.24456787109375, 2.47509765625, 2.70562744140625, 2.9361572265625, 3.16668701171875, 3.397216796875, 3.62774658203125, 3.8582763671875, 4.08880615234375, 4.3193359375, 4.54986572265625, 4.7803955078125, 5.01092529296875, 5.241455078125, 5.47198486328125, 5.7025146484375, 5.93304443359375, 6.16357421875, 6.39410400390625, 6.6246337890625, 6.85516357421875, 7.085693359375, 7.31622314453125, 7.5467529296875, 7.77728271484375, 8.0078125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 13.0, 11.0, 21.0, 23.0, 21.0, 35.0, 75.0, 108.0, 157.0, 271.0, 558.0, 1714.0, 21096.0, 4032250.0, 132839.0, 3295.0, 812.0, 355.0, 184.0, 140.0, 87.0, 75.0, 38.0, 23.0, 21.0, 17.0, 6.0, 9.0, 5.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.78125, -34.805908203125, -33.83056640625, -32.855224609375, -31.8798828125, -30.904541015625, -29.92919921875, -28.953857421875, -27.978515625, -27.003173828125, -26.02783203125, -25.052490234375, -24.0771484375, -23.101806640625, -22.12646484375, -21.151123046875, -20.17578125, -19.200439453125, -18.22509765625, -17.249755859375, -16.2744140625, -15.299072265625, -14.32373046875, -13.348388671875, -12.373046875, -11.397705078125, -10.42236328125, -9.447021484375, -8.4716796875, -7.496337890625, -6.52099609375, -5.545654296875, -4.5703125, -3.594970703125, -2.61962890625, -1.644287109375, -0.6689453125, 0.306396484375, 1.28173828125, 2.257080078125, 3.232421875, 4.207763671875, 5.18310546875, 6.158447265625, 7.1337890625, 8.109130859375, 9.08447265625, 10.059814453125, 11.03515625, 12.010498046875, 12.98583984375, 13.961181640625, 14.9365234375, 15.911865234375, 16.88720703125, 17.862548828125, 18.837890625, 19.813232421875, 20.78857421875, 21.763916015625, 22.7392578125, 23.714599609375, 24.68994140625, 25.665283203125, 26.640625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 234.0, 774.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.5100555419922, -139.38560485839844, -131.26116943359375, -123.13671875, -115.01226806640625, -106.88782501220703, -98.76338195800781, -90.63893127441406, -82.51448822021484, -74.39004516601562, -66.26559448242188, -58.141151428222656, -50.01670455932617, -41.89225769042969, -33.76781463623047, -25.643367767333984, -17.5189208984375, -9.394474983215332, -1.270029067993164, 6.8544158935546875, 14.978862762451172, 23.103309631347656, 31.227752685546875, 39.35219955444336, 47.476646423339844, 55.60109329223633, 63.72554016113281, 71.84998321533203, 79.97442626953125, 88.098876953125, 96.22332000732422, 104.34776306152344, 112.47219848632812, 120.59664154052734, 128.72108459472656, 136.8455352783203, 144.96998596191406, 153.09442138671875, 161.2188720703125, 169.34332275390625, 177.4677734375, 185.59222412109375, 193.71665954589844, 201.8411102294922, 209.96556091308594, 218.08999633789062, 226.21444702148438, 234.33889770507812, 242.4633331298828, 250.58778381347656, 258.71221923828125, 266.836669921875, 274.96112060546875, 283.0855712890625, 291.21002197265625, 299.3344421386719, 307.4588928222656, 315.5833435058594, 323.7077941894531, 331.83221435546875, 339.9566650390625, 348.08111572265625, 356.20556640625, 364.33001708984375, 372.4544677734375]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 10.0, 16.0, 10.0, 18.0, 19.0, 24.0, 37.0, 25.0, 31.0, 28.0, 34.0, 31.0, 33.0, 43.0, 50.0, 37.0, 44.0, 42.0, 45.0, 45.0, 45.0, 40.0, 30.0, 39.0, 32.0, 26.0, 33.0, 27.0, 18.0, 17.0, 13.0, 8.0, 5.0, 5.0, 5.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.554351806640625, -27.680984497070312, -26.8076171875, -25.934249877929688, -25.060882568359375, -24.187515258789062, -23.31414794921875, -22.440778732299805, -21.567411422729492, -20.69404411315918, -19.820676803588867, -18.947309494018555, -18.073942184448242, -17.200572967529297, -16.327205657958984, -15.453838348388672, -14.580471992492676, -13.707104682922363, -12.83373737335205, -11.960369110107422, -11.08700180053711, -10.213634490966797, -9.340267181396484, -8.466899871826172, -7.593532085418701, -6.720164775848389, -5.846796989440918, -4.9734296798706055, -4.100062370300293, -3.2266945838928223, -2.3533272743225098, -1.479959487915039, -0.6065921783447266, 0.26677531003952026, 1.140142798423767, 2.013510227203369, 2.8868777751922607, 3.7602453231811523, 4.633612632751465, 5.5069804191589355, 6.380347728729248, 7.2537150382995605, 8.127082824707031, 9.000450134277344, 9.873817443847656, 10.747184753417969, 11.620552062988281, 12.49392032623291, 13.367287635803223, 14.240654945373535, 15.114022254943848, 15.987390518188477, 16.86075782775879, 17.7341251373291, 18.607492446899414, 19.480859756469727, 20.35422706604004, 21.22759437561035, 22.100961685180664, 22.974328994750977, 23.84769630432129, 24.721065521240234, 25.594432830810547, 26.46780014038086, 27.341167449951172]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 5.0, 7.0, 4.0, 6.0, 13.0, 11.0, 24.0, 15.0, 16.0, 27.0, 35.0, 40.0, 41.0, 45.0, 46.0, 48.0, 43.0, 43.0, 43.0, 59.0, 40.0, 37.0, 39.0, 29.0, 37.0, 32.0, 33.0, 25.0, 24.0, 18.0, 17.0, 27.0, 13.0, 12.0, 9.0, 5.0, 6.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7529296875, -1.6924285888671875, -1.631927490234375, -1.5714263916015625, -1.51092529296875, -1.4504241943359375, -1.389923095703125, -1.3294219970703125, -1.2689208984375, -1.2084197998046875, -1.147918701171875, -1.0874176025390625, -1.02691650390625, -0.9664154052734375, -0.905914306640625, -0.8454132080078125, -0.784912109375, -0.7244110107421875, -0.663909912109375, -0.6034088134765625, -0.54290771484375, -0.4824066162109375, -0.421905517578125, -0.3614044189453125, -0.3009033203125, -0.2404022216796875, -0.179901123046875, -0.1194000244140625, -0.05889892578125, 0.0016021728515625, 0.062103271484375, 0.1226043701171875, 0.18310546875, 0.2436065673828125, 0.304107666015625, 0.3646087646484375, 0.42510986328125, 0.4856109619140625, 0.546112060546875, 0.6066131591796875, 0.6671142578125, 0.7276153564453125, 0.788116455078125, 0.8486175537109375, 0.90911865234375, 0.9696197509765625, 1.030120849609375, 1.0906219482421875, 1.151123046875, 1.2116241455078125, 1.272125244140625, 1.3326263427734375, 1.39312744140625, 1.4536285400390625, 1.514129638671875, 1.5746307373046875, 1.6351318359375, 1.6956329345703125, 1.756134033203125, 1.8166351318359375, 1.87713623046875, 1.9376373291015625, 1.998138427734375, 2.0586395263671875, 2.119140625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 11.0, 16.0, 33.0, 39.0, 48.0, 56.0, 99.0, 157.0, 172.0, 282.0, 407.0, 577.0, 772.0, 1144.0, 1737.0, 2392.0, 3574.0, 5188.0, 7987.0, 11737.0, 17870.0, 27535.0, 43300.0, 69736.0, 117871.0, 283850.0, 188585.0, 96788.0, 58323.0, 36974.0, 23900.0, 15460.0, 10103.0, 6941.0, 4629.0, 3190.0, 2197.0, 1490.0, 1027.0, 684.0, 489.0, 348.0, 248.0, 175.0, 128.0, 89.0, 48.0, 50.0, 32.0, 21.0, 15.0, 14.0, 9.0, 2.0, 5.0, 1.0, 1.0], "bins": [-0.1842041015625, -0.17859268188476562, -0.17298126220703125, -0.16736984252929688, -0.1617584228515625, -0.15614700317382812, -0.15053558349609375, -0.14492416381835938, -0.139312744140625, -0.13370132446289062, -0.12808990478515625, -0.12247848510742188, -0.1168670654296875, -0.11125564575195312, -0.10564422607421875, -0.10003280639648438, -0.09442138671875, -0.08880996704101562, -0.08319854736328125, -0.07758712768554688, -0.0719757080078125, -0.06636428833007812, -0.06075286865234375, -0.055141448974609375, -0.049530029296875, -0.043918609619140625, -0.03830718994140625, -0.032695770263671875, -0.0270843505859375, -0.021472930908203125, -0.01586151123046875, -0.010250091552734375, -0.004638671875, 0.000972747802734375, 0.00658416748046875, 0.012195587158203125, 0.0178070068359375, 0.023418426513671875, 0.02902984619140625, 0.034641265869140625, 0.040252685546875, 0.045864105224609375, 0.05147552490234375, 0.057086944580078125, 0.0626983642578125, 0.06830978393554688, 0.07392120361328125, 0.07953262329101562, 0.08514404296875, 0.09075546264648438, 0.09636688232421875, 0.10197830200195312, 0.1075897216796875, 0.11320114135742188, 0.11881256103515625, 0.12442398071289062, 0.130035400390625, 0.13564682006835938, 0.14125823974609375, 0.14686965942382812, 0.1524810791015625, 0.15809249877929688, 0.16370391845703125, 0.16931533813476562, 0.1749267578125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 4.0, 13.0, 11.0, 10.0, 17.0, 23.0, 22.0, 23.0, 28.0, 28.0, 25.0, 19.0, 36.0, 34.0, 38.0, 30.0, 50.0, 39.0, 1053.0, 53.0, 34.0, 35.0, 38.0, 36.0, 31.0, 39.0, 20.0, 31.0, 29.0, 18.0, 19.0, 17.0, 14.0, 12.0, 13.0, 10.0, 8.0, 9.0, 6.0, 7.0, 5.0, 3.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2490234375, -1.2074432373046875, -1.165863037109375, -1.1242828369140625, -1.08270263671875, -1.0411224365234375, -0.999542236328125, -0.9579620361328125, -0.9163818359375, -0.8748016357421875, -0.833221435546875, -0.7916412353515625, -0.75006103515625, -0.7084808349609375, -0.666900634765625, -0.6253204345703125, -0.583740234375, -0.5421600341796875, -0.500579833984375, -0.4589996337890625, -0.41741943359375, -0.3758392333984375, -0.334259033203125, -0.2926788330078125, -0.2510986328125, -0.2095184326171875, -0.167938232421875, -0.1263580322265625, -0.08477783203125, -0.0431976318359375, -0.001617431640625, 0.0399627685546875, 0.08154296875, 0.1231231689453125, 0.164703369140625, 0.2062835693359375, 0.24786376953125, 0.2894439697265625, 0.331024169921875, 0.3726043701171875, 0.4141845703125, 0.4557647705078125, 0.497344970703125, 0.5389251708984375, 0.58050537109375, 0.6220855712890625, 0.663665771484375, 0.7052459716796875, 0.746826171875, 0.7884063720703125, 0.829986572265625, 0.8715667724609375, 0.91314697265625, 0.9547271728515625, 0.996307373046875, 1.0378875732421875, 1.0794677734375, 1.1210479736328125, 1.162628173828125, 1.2042083740234375, 1.24578857421875, 1.2873687744140625, 1.328948974609375, 1.3705291748046875, 1.412109375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 17.0, 13.0, 25.0, 32.0, 44.0, 59.0, 84.0, 140.0, 190.0, 273.0, 400.0, 595.0, 757.0, 1177.0, 1700.0, 2475.0, 3649.0, 5453.0, 8310.0, 12708.0, 19953.0, 33203.0, 56444.0, 105038.0, 1340257.0, 260792.0, 100757.0, 54179.0, 31957.0, 19592.0, 12420.0, 8076.0, 5262.0, 3505.0, 2356.0, 1600.0, 1095.0, 818.0, 530.0, 348.0, 275.0, 168.0, 115.0, 100.0, 57.0, 51.0, 28.0, 18.0, 12.0, 7.0, 9.0, 3.0, 3.0, 2.0, 3.0], "bins": [-0.09423828125, -0.09146404266357422, -0.08868980407714844, -0.08591556549072266, -0.08314132690429688, -0.0803670883178711, -0.07759284973144531, -0.07481861114501953, -0.07204437255859375, -0.06927013397216797, -0.06649589538574219, -0.0637216567993164, -0.060947418212890625, -0.058173179626464844, -0.05539894104003906, -0.05262470245361328, -0.0498504638671875, -0.04707622528076172, -0.04430198669433594, -0.041527748107910156, -0.038753509521484375, -0.035979270935058594, -0.03320503234863281, -0.03043079376220703, -0.02765655517578125, -0.02488231658935547, -0.022108078002929688, -0.019333839416503906, -0.016559600830078125, -0.013785362243652344, -0.011011123657226562, -0.008236885070800781, -0.005462646484375, -0.0026884078979492188, 8.58306884765625e-05, 0.0028600692749023438, 0.005634307861328125, 0.008408546447753906, 0.011182785034179688, 0.013957023620605469, 0.01673126220703125, 0.01950550079345703, 0.022279739379882812, 0.025053977966308594, 0.027828216552734375, 0.030602455139160156, 0.03337669372558594, 0.03615093231201172, 0.0389251708984375, 0.04169940948486328, 0.04447364807128906, 0.047247886657714844, 0.050022125244140625, 0.052796363830566406, 0.05557060241699219, 0.05834484100341797, 0.06111907958984375, 0.06389331817626953, 0.06666755676269531, 0.0694417953491211, 0.07221603393554688, 0.07499027252197266, 0.07776451110839844, 0.08053874969482422, 0.08331298828125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 13.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 17.0, 18.0, 22.0, 26.0, 26.0, 30.0, 37.0, 41.0, 71.0, 101.0, 152.0, 86.0, 46.0, 47.0, 34.0, 34.0, 23.0, 26.0, 27.0, 18.0, 15.0, 12.0, 6.0, 12.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.52587890625e-05, -1.4786608517169952e-05, -1.4314427971839905e-05, -1.3842247426509857e-05, -1.337006688117981e-05, -1.2897886335849762e-05, -1.2425705790519714e-05, -1.1953525245189667e-05, -1.1481344699859619e-05, -1.1009164154529572e-05, -1.0536983609199524e-05, -1.0064803063869476e-05, -9.592622518539429e-06, -9.120441973209381e-06, -8.648261427879333e-06, -8.176080882549286e-06, -7.703900337219238e-06, -7.231719791889191e-06, -6.759539246559143e-06, -6.2873587012290955e-06, -5.815178155899048e-06, -5.342997610569e-06, -4.870817065238953e-06, -4.398636519908905e-06, -3.926455974578857e-06, -3.45427542924881e-06, -2.982094883918762e-06, -2.5099143385887146e-06, -2.037733793258667e-06, -1.5655532479286194e-06, -1.0933727025985718e-06, -6.211921572685242e-07, -1.4901161193847656e-07, 3.2316893339157104e-07, 7.953494787216187e-07, 1.2675300240516663e-06, 1.7397105693817139e-06, 2.2118911147117615e-06, 2.684071660041809e-06, 3.1562522053718567e-06, 3.6284327507019043e-06, 4.100613296031952e-06, 4.5727938413619995e-06, 5.044974386692047e-06, 5.517154932022095e-06, 5.989335477352142e-06, 6.46151602268219e-06, 6.9336965680122375e-06, 7.405877113342285e-06, 7.878057658672333e-06, 8.35023820400238e-06, 8.822418749332428e-06, 9.294599294662476e-06, 9.766779839992523e-06, 1.023896038532257e-05, 1.0711140930652618e-05, 1.1183321475982666e-05, 1.1655502021312714e-05, 1.2127682566642761e-05, 1.2599863111972809e-05, 1.3072043657302856e-05, 1.3544224202632904e-05, 1.4016404747962952e-05, 1.4488585293293e-05, 1.4960765838623047e-05]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 10.0, 12.0, 11.0, 7.0, 17.0, 13.0, 17.0, 30.0, 28.0, 43.0, 45.0, 95.0, 99.0, 164.0, 265.0, 560.0, 16366.0, 1026955.0, 2557.0, 437.0, 237.0, 146.0, 110.0, 78.0, 40.0, 45.0, 36.0, 27.0, 19.0, 13.0, 13.0, 13.0, 3.0, 4.0, 7.0, 8.0, 4.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033473968505859375, -0.0003233402967453003, -0.00031194090843200684, -0.0003005415201187134, -0.0002891421318054199, -0.00027774274349212646, -0.000266343355178833, -0.00025494396686553955, -0.0002435445785522461, -0.00023214519023895264, -0.00022074580192565918, -0.00020934641361236572, -0.00019794702529907227, -0.0001865476369857788, -0.00017514824867248535, -0.0001637488603591919, -0.00015234947204589844, -0.00014095008373260498, -0.00012955069541931152, -0.00011815130710601807, -0.00010675191879272461, -9.535253047943115e-05, -8.39531421661377e-05, -7.255375385284424e-05, -6.115436553955078e-05, -4.9754977226257324e-05, -3.835558891296387e-05, -2.695620059967041e-05, -1.5556812286376953e-05, -4.157423973083496e-06, 7.241964340209961e-06, 1.8641352653503418e-05, 3.0040740966796875e-05, 4.144012928009033e-05, 5.283951759338379e-05, 6.423890590667725e-05, 7.56382942199707e-05, 8.703768253326416e-05, 9.843707084655762e-05, 0.00010983645915985107, 0.00012123584747314453, 0.000132635235786438, 0.00014403462409973145, 0.0001554340124130249, 0.00016683340072631836, 0.00017823278903961182, 0.00018963217735290527, 0.00020103156566619873, 0.0002124309539794922, 0.00022383034229278564, 0.0002352297306060791, 0.00024662911891937256, 0.000258028507232666, 0.00026942789554595947, 0.00028082728385925293, 0.0002922266721725464, 0.00030362606048583984, 0.0003150254487991333, 0.00032642483711242676, 0.0003378242254257202, 0.00034922361373901367, 0.00036062300205230713, 0.0003720223903656006, 0.00038342177867889404, 0.0003948211669921875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 32.0, 200.0, 569.0, 161.0, 30.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.788917405880056e-05, -5.67844181205146e-05, -5.567966218222864e-05, -5.457490624394268e-05, -5.3470150305656716e-05, -5.2365394367370754e-05, -5.126063842908479e-05, -5.015588249079883e-05, -4.905112655251287e-05, -4.794637061422691e-05, -4.6841614675940946e-05, -4.5736858737654984e-05, -4.463210279936902e-05, -4.352734686108306e-05, -4.24225909227971e-05, -4.131783498451114e-05, -4.021307540824637e-05, -3.9108319469960406e-05, -3.8003563531674445e-05, -3.689880759338848e-05, -3.579405165510252e-05, -3.468929571681656e-05, -3.35845397785306e-05, -3.2479783840244636e-05, -3.1375027901958674e-05, -3.0270271963672712e-05, -2.916551602538675e-05, -2.806076008710079e-05, -2.6956004148814827e-05, -2.5851248210528865e-05, -2.4746492272242904e-05, -2.3641736333956942e-05, -2.2536982214660384e-05, -2.1432226276374422e-05, -2.032747033808846e-05, -1.92227143998025e-05, -1.8117958461516537e-05, -1.7013202523230575e-05, -1.590844476595521e-05, -1.480368973716395e-05, -1.3698933798877988e-05, -1.2594177860592026e-05, -1.1489421922306065e-05, -1.0384665074525401e-05, -9.27990913623944e-06, -8.175153197953478e-06, -7.070397259667516e-06, -5.965641321381554e-06, -4.860885383095592e-06, -3.7561294448096305e-06, -2.6513732791499933e-06, -1.5466171134903561e-06, -4.418611752043944e-07, 6.628947630815674e-07, 1.76765115611488e-06, 2.8724070944008417e-06, 3.9771630326868035e-06, 5.081918970972765e-06, 6.186674909258727e-06, 7.29143130229204e-06, 8.396187695325352e-06, 9.500943633611314e-06, 1.0605699571897276e-05, 1.1710455510183237e-05, 1.28152114484692e-05]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 4.0, 7.0, 9.0, 8.0, 8.0, 9.0, 9.0, 14.0, 13.0, 25.0, 18.0, 26.0, 24.0, 28.0, 32.0, 37.0, 28.0, 41.0, 44.0, 47.0, 55.0, 30.0, 45.0, 37.0, 50.0, 38.0, 39.0, 29.0, 20.0, 41.0, 21.0, 24.0, 22.0, 17.0, 15.0, 13.0, 17.0, 8.0, 5.0, 9.0, 6.0, 10.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.033348083496094e-06, -6.806105375289917e-06, -6.57886266708374e-06, -6.3516199588775635e-06, -6.124377250671387e-06, -5.89713454246521e-06, -5.669891834259033e-06, -5.4426491260528564e-06, -5.21540641784668e-06, -4.988163709640503e-06, -4.760921001434326e-06, -4.533678293228149e-06, -4.306435585021973e-06, -4.079192876815796e-06, -3.851950168609619e-06, -3.6247074604034424e-06, -3.3974647521972656e-06, -3.170222043991089e-06, -2.942979335784912e-06, -2.7157366275787354e-06, -2.4884939193725586e-06, -2.261251211166382e-06, -2.034008502960205e-06, -1.8067657947540283e-06, -1.5795230865478516e-06, -1.3522803783416748e-06, -1.125037670135498e-06, -8.977949619293213e-07, -6.705522537231445e-07, -4.4330954551696777e-07, -2.1606683731079102e-07, 1.1175870895385742e-08, 2.384185791015625e-07, 4.6566128730773926e-07, 6.92903995513916e-07, 9.201467037200928e-07, 1.1473894119262695e-06, 1.3746321201324463e-06, 1.601874828338623e-06, 1.8291175365447998e-06, 2.0563602447509766e-06, 2.2836029529571533e-06, 2.51084566116333e-06, 2.738088369369507e-06, 2.9653310775756836e-06, 3.1925737857818604e-06, 3.419816493988037e-06, 3.647059202194214e-06, 3.874301910400391e-06, 4.101544618606567e-06, 4.328787326812744e-06, 4.556030035018921e-06, 4.783272743225098e-06, 5.010515451431274e-06, 5.237758159637451e-06, 5.465000867843628e-06, 5.692243576049805e-06, 5.9194862842559814e-06, 6.146728992462158e-06, 6.373971700668335e-06, 6.601214408874512e-06, 6.8284571170806885e-06, 7.055699825286865e-06, 7.282942533493042e-06, 7.510185241699219e-06]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 5.0, 7.0, 4.0, 6.0, 13.0, 11.0, 24.0, 15.0, 16.0, 27.0, 35.0, 40.0, 41.0, 45.0, 46.0, 48.0, 43.0, 43.0, 43.0, 59.0, 40.0, 37.0, 39.0, 29.0, 37.0, 32.0, 33.0, 25.0, 24.0, 18.0, 17.0, 27.0, 13.0, 12.0, 9.0, 5.0, 6.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7529296875, -1.6924285888671875, -1.631927490234375, -1.5714263916015625, -1.51092529296875, -1.4504241943359375, -1.389923095703125, -1.3294219970703125, -1.2689208984375, -1.2084197998046875, -1.147918701171875, -1.0874176025390625, -1.02691650390625, -0.9664154052734375, -0.905914306640625, -0.8454132080078125, -0.784912109375, -0.7244110107421875, -0.663909912109375, -0.6034088134765625, -0.54290771484375, -0.4824066162109375, -0.421905517578125, -0.3614044189453125, -0.3009033203125, -0.2404022216796875, -0.179901123046875, -0.1194000244140625, -0.05889892578125, 0.0016021728515625, 0.062103271484375, 0.1226043701171875, 0.18310546875, 0.2436065673828125, 0.304107666015625, 0.3646087646484375, 0.42510986328125, 0.4856109619140625, 0.546112060546875, 0.6066131591796875, 0.6671142578125, 0.7276153564453125, 0.788116455078125, 0.8486175537109375, 0.90911865234375, 0.9696197509765625, 1.030120849609375, 1.0906219482421875, 1.151123046875, 1.2116241455078125, 1.272125244140625, 1.3326263427734375, 1.39312744140625, 1.4536285400390625, 1.514129638671875, 1.5746307373046875, 1.6351318359375, 1.6956329345703125, 1.756134033203125, 1.8166351318359375, 1.87713623046875, 1.9376373291015625, 1.998138427734375, 2.0586395263671875, 2.119140625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 10.0, 6.0, 13.0, 16.0, 31.0, 31.0, 45.0, 72.0, 108.0, 122.0, 164.0, 230.0, 344.0, 463.0, 640.0, 833.0, 1274.0, 1993.0, 3010.0, 5429.0, 12311.0, 44171.0, 485495.0, 423633.0, 41656.0, 11794.0, 5358.0, 2999.0, 1902.0, 1192.0, 882.0, 624.0, 457.0, 346.0, 255.0, 170.0, 131.0, 89.0, 56.0, 46.0, 52.0, 21.0, 21.0, 17.0, 16.0, 8.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.359375, -14.879150390625, -14.39892578125, -13.918701171875, -13.4384765625, -12.958251953125, -12.47802734375, -11.997802734375, -11.517578125, -11.037353515625, -10.55712890625, -10.076904296875, -9.5966796875, -9.116455078125, -8.63623046875, -8.156005859375, -7.67578125, -7.195556640625, -6.71533203125, -6.235107421875, -5.7548828125, -5.274658203125, -4.79443359375, -4.314208984375, -3.833984375, -3.353759765625, -2.87353515625, -2.393310546875, -1.9130859375, -1.432861328125, -0.95263671875, -0.472412109375, 0.0078125, 0.488037109375, 0.96826171875, 1.448486328125, 1.9287109375, 2.408935546875, 2.88916015625, 3.369384765625, 3.849609375, 4.329833984375, 4.81005859375, 5.290283203125, 5.7705078125, 6.250732421875, 6.73095703125, 7.211181640625, 7.69140625, 8.171630859375, 8.65185546875, 9.132080078125, 9.6123046875, 10.092529296875, 10.57275390625, 11.052978515625, 11.533203125, 12.013427734375, 12.49365234375, 12.973876953125, 13.4541015625, 13.934326171875, 14.41455078125, 14.894775390625, 15.375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 7.0, 3.0, 4.0, 6.0, 9.0, 5.0, 10.0, 13.0, 12.0, 19.0, 23.0, 30.0, 16.0, 20.0, 24.0, 32.0, 31.0, 39.0, 44.0, 43.0, 54.0, 62.0, 121.0, 1492.0, 284.0, 119.0, 73.0, 43.0, 53.0, 39.0, 32.0, 38.0, 32.0, 33.0, 31.0, 19.0, 19.0, 17.0, 27.0, 16.0, 11.0, 9.0, 9.0, 11.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0], "bins": [-6.3515625, -6.169921875, -5.98828125, -5.806640625, -5.625, -5.443359375, -5.26171875, -5.080078125, -4.8984375, -4.716796875, -4.53515625, -4.353515625, -4.171875, -3.990234375, -3.80859375, -3.626953125, -3.4453125, -3.263671875, -3.08203125, -2.900390625, -2.71875, -2.537109375, -2.35546875, -2.173828125, -1.9921875, -1.810546875, -1.62890625, -1.447265625, -1.265625, -1.083984375, -0.90234375, -0.720703125, -0.5390625, -0.357421875, -0.17578125, 0.005859375, 0.1875, 0.369140625, 0.55078125, 0.732421875, 0.9140625, 1.095703125, 1.27734375, 1.458984375, 1.640625, 1.822265625, 2.00390625, 2.185546875, 2.3671875, 2.548828125, 2.73046875, 2.912109375, 3.09375, 3.275390625, 3.45703125, 3.638671875, 3.8203125, 4.001953125, 4.18359375, 4.365234375, 4.546875, 4.728515625, 4.91015625, 5.091796875, 5.2734375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 10.0, 10.0, 4.0, 11.0, 23.0, 12.0, 16.0, 18.0, 31.0, 18.0, 30.0, 36.0, 63.0, 60.0, 126.0, 295.0, 819.0, 3649.0, 31295.0, 3014957.0, 86075.0, 6081.0, 1179.0, 344.0, 146.0, 86.0, 52.0, 47.0, 25.0, 26.0, 22.0, 18.0, 17.0, 19.0, 11.0, 7.0, 14.0, 6.0, 9.0, 5.0, 7.0, 2.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.34375, -22.55615234375, -21.7685546875, -20.98095703125, -20.193359375, -19.40576171875, -18.6181640625, -17.83056640625, -17.04296875, -16.25537109375, -15.4677734375, -14.68017578125, -13.892578125, -13.10498046875, -12.3173828125, -11.52978515625, -10.7421875, -9.95458984375, -9.1669921875, -8.37939453125, -7.591796875, -6.80419921875, -6.0166015625, -5.22900390625, -4.44140625, -3.65380859375, -2.8662109375, -2.07861328125, -1.291015625, -0.50341796875, 0.2841796875, 1.07177734375, 1.859375, 2.64697265625, 3.4345703125, 4.22216796875, 5.009765625, 5.79736328125, 6.5849609375, 7.37255859375, 8.16015625, 8.94775390625, 9.7353515625, 10.52294921875, 11.310546875, 12.09814453125, 12.8857421875, 13.67333984375, 14.4609375, 15.24853515625, 16.0361328125, 16.82373046875, 17.611328125, 18.39892578125, 19.1865234375, 19.97412109375, 20.76171875, 21.54931640625, 22.3369140625, 23.12451171875, 23.912109375, 24.69970703125, 25.4873046875, 26.27490234375, 27.0625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 19.0, 75.0, 286.0, 348.0, 184.0, 60.0, 18.0, 10.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.820045471191406, -7.368402481079102, -5.916759490966797, -4.465116500854492, -3.0134735107421875, -1.5618305206298828, -0.11018753051757812, 1.3414554595947266, 2.7930984497070312, 4.244741439819336, 5.696384429931641, 7.148027420043945, 8.59967041015625, 10.051313400268555, 11.50295639038086, 12.954599380493164, 14.406242370605469, 15.857885360717773, 17.309528350830078, 18.761171340942383, 20.212814331054688, 21.664457321166992, 23.116100311279297, 24.5677433013916, 26.019386291503906, 27.47102928161621, 28.922672271728516, 30.37431526184082, 31.825958251953125, 33.27760314941406, 34.729244232177734, 36.180885314941406, 37.632530212402344, 39.08417510986328, 40.53581619262695, 41.987457275390625, 43.43910217285156, 44.8907470703125, 46.34238815307617, 47.794029235839844, 49.24567413330078, 50.69731903076172, 52.14896011352539, 53.60060119628906, 55.05224609375, 56.50389099121094, 57.95553207397461, 59.40717315673828, 60.85881805419922, 62.310462951660156, 63.76210403442383, 65.2137451171875, 66.66539001464844, 68.11703491210938, 69.56867980957031, 71.02031707763672, 72.47196197509766, 73.9236068725586, 75.375244140625, 76.82688903808594, 78.27853393554688, 79.73017883300781, 81.18182373046875, 82.63346099853516, 84.0851058959961]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 0.0, 4.0, 7.0, 7.0, 5.0, 8.0, 9.0, 14.0, 12.0, 20.0, 15.0, 21.0, 20.0, 32.0, 29.0, 36.0, 33.0, 36.0, 34.0, 38.0, 38.0, 34.0, 38.0, 52.0, 33.0, 44.0, 39.0, 38.0, 46.0, 34.0, 22.0, 26.0, 28.0, 24.0, 23.0, 22.0, 15.0, 19.0, 8.0, 8.0, 8.0, 6.0, 2.0, 5.0, 7.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-28.412071228027344, -27.595428466796875, -26.77878761291504, -25.96214485168457, -25.145503997802734, -24.328861236572266, -23.512218475341797, -22.69557762145996, -21.878936767578125, -21.062294006347656, -20.24565315246582, -19.42901039123535, -18.612369537353516, -17.795726776123047, -16.979084014892578, -16.162443161010742, -15.345800399780273, -14.529158592224121, -13.712516784667969, -12.8958740234375, -12.079233169555664, -11.262590408325195, -10.445948600769043, -9.62930679321289, -8.812664985656738, -7.996023178100586, -7.179381370544434, -6.362739086151123, -5.546097278594971, -4.729455471038818, -3.912813186645508, -3.0961713790893555, -2.279529571533203, -1.4628876447677612, -0.6462457180023193, 0.1703963279724121, 0.9870381355285645, 1.8036799430847168, 2.6203222274780273, 3.4369640350341797, 4.253605842590332, 5.070247650146484, 5.886889457702637, 6.703531742095947, 7.5201735496521, 8.336814880371094, 9.153457641601562, 9.970099449157715, 10.786741256713867, 11.60338306427002, 12.420024871826172, 13.23666763305664, 14.053308486938477, 14.869951248168945, 15.686593055725098, 16.50323486328125, 17.31987762451172, 18.136520385742188, 18.953161239624023, 19.769804000854492, 20.586444854736328, 21.403087615966797, 22.219730377197266, 23.0363712310791, 23.853012084960938]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 7.0, 5.0, 15.0, 15.0, 9.0, 17.0, 24.0, 22.0, 35.0, 35.0, 42.0, 40.0, 48.0, 39.0, 50.0, 39.0, 54.0, 41.0, 53.0, 37.0, 37.0, 36.0, 41.0, 29.0, 31.0, 29.0, 21.0, 21.0, 21.0, 16.0, 22.0, 14.0, 8.0, 2.0, 8.0, 4.0, 7.0, 8.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6962890625, -1.6341094970703125, -1.571929931640625, -1.5097503662109375, -1.44757080078125, -1.3853912353515625, -1.323211669921875, -1.2610321044921875, -1.1988525390625, -1.1366729736328125, -1.074493408203125, -1.0123138427734375, -0.95013427734375, -0.8879547119140625, -0.825775146484375, -0.7635955810546875, -0.701416015625, -0.6392364501953125, -0.577056884765625, -0.5148773193359375, -0.45269775390625, -0.3905181884765625, -0.328338623046875, -0.2661590576171875, -0.2039794921875, -0.1417999267578125, -0.079620361328125, -0.0174407958984375, 0.04473876953125, 0.1069183349609375, 0.169097900390625, 0.2312774658203125, 0.29345703125, 0.3556365966796875, 0.417816162109375, 0.4799957275390625, 0.54217529296875, 0.6043548583984375, 0.666534423828125, 0.7287139892578125, 0.7908935546875, 0.8530731201171875, 0.915252685546875, 0.9774322509765625, 1.03961181640625, 1.1017913818359375, 1.163970947265625, 1.2261505126953125, 1.288330078125, 1.3505096435546875, 1.412689208984375, 1.4748687744140625, 1.53704833984375, 1.5992279052734375, 1.661407470703125, 1.7235870361328125, 1.7857666015625, 1.8479461669921875, 1.910125732421875, 1.9723052978515625, 2.03448486328125, 2.0966644287109375, 2.158843994140625, 2.2210235595703125, 2.283203125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 3.0, 2.0, 6.0, 2.0, 8.0, 9.0, 26.0, 14.0, 36.0, 38.0, 49.0, 84.0, 141.0, 194.0, 318.0, 623.0, 1118.0, 3589.0, 30414.0, 3073253.0, 1059847.0, 18980.0, 2933.0, 1048.0, 533.0, 337.0, 192.0, 142.0, 84.0, 76.0, 45.0, 27.0, 24.0, 30.0, 14.0, 11.0, 12.0, 4.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.953125, -18.297607421875, -17.64208984375, -16.986572265625, -16.3310546875, -15.675537109375, -15.02001953125, -14.364501953125, -13.708984375, -13.053466796875, -12.39794921875, -11.742431640625, -11.0869140625, -10.431396484375, -9.77587890625, -9.120361328125, -8.46484375, -7.809326171875, -7.15380859375, -6.498291015625, -5.8427734375, -5.187255859375, -4.53173828125, -3.876220703125, -3.220703125, -2.565185546875, -1.90966796875, -1.254150390625, -0.5986328125, 0.056884765625, 0.71240234375, 1.367919921875, 2.0234375, 2.678955078125, 3.33447265625, 3.989990234375, 4.6455078125, 5.301025390625, 5.95654296875, 6.612060546875, 7.267578125, 7.923095703125, 8.57861328125, 9.234130859375, 9.8896484375, 10.545166015625, 11.20068359375, 11.856201171875, 12.51171875, 13.167236328125, 13.82275390625, 14.478271484375, 15.1337890625, 15.789306640625, 16.44482421875, 17.100341796875, 17.755859375, 18.411376953125, 19.06689453125, 19.722412109375, 20.3779296875, 21.033447265625, 21.68896484375, 22.344482421875, 23.0]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 6.0, 7.0, 8.0, 14.0, 22.0, 27.0, 41.0, 46.0, 67.0, 88.0, 129.0, 194.0, 251.0, 358.0, 498.0, 581.0, 499.0, 341.0, 257.0, 163.0, 130.0, 93.0, 74.0, 40.0, 29.0, 28.0, 20.0, 13.0, 11.0, 7.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0], "bins": [-7.6484375, -7.43902587890625, -7.2296142578125, -7.02020263671875, -6.810791015625, -6.60137939453125, -6.3919677734375, -6.18255615234375, -5.97314453125, -5.76373291015625, -5.5543212890625, -5.34490966796875, -5.135498046875, -4.92608642578125, -4.7166748046875, -4.50726318359375, -4.2978515625, -4.08843994140625, -3.8790283203125, -3.66961669921875, -3.460205078125, -3.25079345703125, -3.0413818359375, -2.83197021484375, -2.62255859375, -2.41314697265625, -2.2037353515625, -1.99432373046875, -1.784912109375, -1.57550048828125, -1.3660888671875, -1.15667724609375, -0.947265625, -0.73785400390625, -0.5284423828125, -0.31903076171875, -0.109619140625, 0.09979248046875, 0.3092041015625, 0.51861572265625, 0.72802734375, 0.93743896484375, 1.1468505859375, 1.35626220703125, 1.565673828125, 1.77508544921875, 1.9844970703125, 2.19390869140625, 2.4033203125, 2.61273193359375, 2.8221435546875, 3.03155517578125, 3.240966796875, 3.45037841796875, 3.6597900390625, 3.86920166015625, 4.07861328125, 4.28802490234375, 4.4974365234375, 4.70684814453125, 4.916259765625, 5.12567138671875, 5.3350830078125, 5.54449462890625, 5.75390625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 8.0, 5.0, 11.0, 24.0, 27.0, 63.0, 110.0, 148.0, 376.0, 799.0, 2709.0, 16740.0, 310075.0, 3674336.0, 173686.0, 11605.0, 2154.0, 685.0, 312.0, 174.0, 76.0, 60.0, 33.0, 21.0, 21.0, 8.0, 4.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.703125, -26.008056640625, -25.31298828125, -24.617919921875, -23.9228515625, -23.227783203125, -22.53271484375, -21.837646484375, -21.142578125, -20.447509765625, -19.75244140625, -19.057373046875, -18.3623046875, -17.667236328125, -16.97216796875, -16.277099609375, -15.58203125, -14.886962890625, -14.19189453125, -13.496826171875, -12.8017578125, -12.106689453125, -11.41162109375, -10.716552734375, -10.021484375, -9.326416015625, -8.63134765625, -7.936279296875, -7.2412109375, -6.546142578125, -5.85107421875, -5.156005859375, -4.4609375, -3.765869140625, -3.07080078125, -2.375732421875, -1.6806640625, -0.985595703125, -0.29052734375, 0.404541015625, 1.099609375, 1.794677734375, 2.48974609375, 3.184814453125, 3.8798828125, 4.574951171875, 5.27001953125, 5.965087890625, 6.66015625, 7.355224609375, 8.05029296875, 8.745361328125, 9.4404296875, 10.135498046875, 10.83056640625, 11.525634765625, 12.220703125, 12.915771484375, 13.61083984375, 14.305908203125, 15.0009765625, 15.696044921875, 16.39111328125, 17.086181640625, 17.78125]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 10.0, 19.0, 41.0, 78.0, 112.0, 140.0, 166.0, 162.0, 106.0, 84.0, 48.0, 22.0, 11.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.060543060302734, -38.82929611206055, -37.598052978515625, -36.36680603027344, -35.13555908203125, -33.90431213378906, -32.67306900024414, -31.441822052001953, -30.2105770111084, -28.979331970214844, -27.748085021972656, -26.5168399810791, -25.285594940185547, -24.05434799194336, -22.823102951049805, -21.59185791015625, -20.360610961914062, -19.129365921020508, -17.89811897277832, -16.666873931884766, -15.435627937316895, -14.204381942749023, -12.973136901855469, -11.741890907287598, -10.510644912719727, -9.279398918151855, -8.048152923583984, -6.81690788269043, -5.585661888122559, -4.3544158935546875, -3.1231703758239746, -1.8919248580932617, -0.6606788635253906, 0.5705668926239014, 1.8018126487731934, 3.0330584049224854, 4.264304161071777, 5.495550155639648, 6.726795673370361, 7.958041191101074, 9.189287185668945, 10.420533180236816, 11.651779174804688, 12.883024215698242, 14.114270210266113, 15.345516204833984, 16.57676124572754, 17.808006286621094, 19.03925323486328, 20.270498275756836, 21.501745223999023, 22.732990264892578, 23.964237213134766, 25.19548225402832, 26.426727294921875, 27.657974243164062, 28.889219284057617, 30.120464324951172, 31.35171127319336, 32.58295822143555, 33.81420135498047, 35.045448303222656, 36.276695251464844, 37.507938385009766, 38.73918533325195]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 1.0, 10.0, 4.0, 4.0, 7.0, 9.0, 9.0, 14.0, 17.0, 21.0, 18.0, 29.0, 23.0, 21.0, 25.0, 30.0, 37.0, 23.0, 41.0, 39.0, 31.0, 46.0, 35.0, 38.0, 38.0, 30.0, 36.0, 41.0, 33.0, 39.0, 27.0, 30.0, 36.0, 26.0, 23.0, 12.0, 17.0, 17.0, 24.0, 5.0, 15.0, 5.0, 1.0, 6.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.756263732910156, -24.08721160888672, -23.41815948486328, -22.749107360839844, -22.080055236816406, -21.41100311279297, -20.74195098876953, -20.072898864746094, -19.403846740722656, -18.73479461669922, -18.06574249267578, -17.396690368652344, -16.727638244628906, -16.05858612060547, -15.389534950256348, -14.72048282623291, -14.051431655883789, -13.382379531860352, -12.713327407836914, -12.044275283813477, -11.375223159790039, -10.706171035766602, -10.03711986541748, -9.368067741394043, -8.699015617370605, -8.029963493347168, -7.3609113693237305, -6.691859722137451, -6.022807598114014, -5.353755474090576, -4.684703826904297, -4.015651702880859, -3.346599578857422, -2.6775474548339844, -2.008495569229126, -1.3394436836242676, -0.6703915596008301, -0.0013394355773925781, 0.6677122116088867, 1.3367643356323242, 2.0058164596557617, 2.674868583679199, 3.3439204692840576, 4.012972354888916, 4.6820244789123535, 5.351076602935791, 6.02012825012207, 6.689180374145508, 7.358232498168945, 8.027284622192383, 8.69633674621582, 9.365388870239258, 10.034440994262695, 10.703493118286133, 11.372544288635254, 12.041596412658691, 12.710648536682129, 13.379700660705566, 14.048752784729004, 14.717803955078125, 15.386856079101562, 16.055908203125, 16.724960327148438, 17.394012451171875, 18.063064575195312]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 5.0, 5.0, 10.0, 3.0, 6.0, 20.0, 13.0, 18.0, 23.0, 17.0, 35.0, 43.0, 40.0, 38.0, 39.0, 30.0, 45.0, 48.0, 48.0, 46.0, 36.0, 44.0, 32.0, 28.0, 49.0, 26.0, 36.0, 32.0, 29.0, 22.0, 16.0, 13.0, 17.0, 16.0, 14.0, 13.0, 11.0, 4.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.728515625, -1.66839599609375, -1.6082763671875, -1.54815673828125, -1.488037109375, -1.42791748046875, -1.3677978515625, -1.30767822265625, -1.24755859375, -1.18743896484375, -1.1273193359375, -1.06719970703125, -1.007080078125, -0.94696044921875, -0.8868408203125, -0.82672119140625, -0.7666015625, -0.70648193359375, -0.6463623046875, -0.58624267578125, -0.526123046875, -0.46600341796875, -0.4058837890625, -0.34576416015625, -0.28564453125, -0.22552490234375, -0.1654052734375, -0.10528564453125, -0.045166015625, 0.01495361328125, 0.0750732421875, 0.13519287109375, 0.1953125, 0.25543212890625, 0.3155517578125, 0.37567138671875, 0.435791015625, 0.49591064453125, 0.5560302734375, 0.61614990234375, 0.67626953125, 0.73638916015625, 0.7965087890625, 0.85662841796875, 0.916748046875, 0.97686767578125, 1.0369873046875, 1.09710693359375, 1.1572265625, 1.21734619140625, 1.2774658203125, 1.33758544921875, 1.397705078125, 1.45782470703125, 1.5179443359375, 1.57806396484375, 1.63818359375, 1.69830322265625, 1.7584228515625, 1.81854248046875, 1.878662109375, 1.93878173828125, 1.9989013671875, 2.05902099609375, 2.119140625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 1.0, 3.0, 11.0, 10.0, 5.0, 21.0, 15.0, 19.0, 46.0, 55.0, 72.0, 113.0, 127.0, 200.0, 261.0, 391.0, 530.0, 780.0, 1095.0, 1469.0, 2218.0, 3256.0, 4850.0, 7088.0, 10824.0, 16740.0, 26458.0, 42659.0, 70324.0, 132116.0, 341111.0, 167019.0, 82999.0, 48934.0, 30120.0, 19159.0, 12234.0, 7944.0, 5445.0, 3626.0, 2458.0, 1727.0, 1212.0, 813.0, 598.0, 399.0, 278.0, 214.0, 143.0, 114.0, 73.0, 67.0, 35.0, 27.0, 22.0, 12.0, 9.0, 10.0, 1.0, 3.0, 1.0, 4.0], "bins": [-0.186279296875, -0.180572509765625, -0.17486572265625, -0.169158935546875, -0.1634521484375, -0.157745361328125, -0.15203857421875, -0.146331787109375, -0.140625, -0.134918212890625, -0.12921142578125, -0.123504638671875, -0.1177978515625, -0.112091064453125, -0.10638427734375, -0.100677490234375, -0.094970703125, -0.089263916015625, -0.08355712890625, -0.077850341796875, -0.0721435546875, -0.066436767578125, -0.06072998046875, -0.055023193359375, -0.04931640625, -0.043609619140625, -0.03790283203125, -0.032196044921875, -0.0264892578125, -0.020782470703125, -0.01507568359375, -0.009368896484375, -0.003662109375, 0.002044677734375, 0.00775146484375, 0.013458251953125, 0.0191650390625, 0.024871826171875, 0.03057861328125, 0.036285400390625, 0.0419921875, 0.047698974609375, 0.05340576171875, 0.059112548828125, 0.0648193359375, 0.070526123046875, 0.07623291015625, 0.081939697265625, 0.087646484375, 0.093353271484375, 0.09906005859375, 0.104766845703125, 0.1104736328125, 0.116180419921875, 0.12188720703125, 0.127593994140625, 0.13330078125, 0.139007568359375, 0.14471435546875, 0.150421142578125, 0.1561279296875, 0.161834716796875, 0.16754150390625, 0.173248291015625, 0.178955078125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 7.0, 7.0, 2.0, 5.0, 7.0, 10.0, 8.0, 14.0, 18.0, 25.0, 20.0, 22.0, 35.0, 40.0, 22.0, 43.0, 45.0, 35.0, 40.0, 50.0, 46.0, 1066.0, 44.0, 55.0, 35.0, 28.0, 33.0, 26.0, 38.0, 24.0, 20.0, 26.0, 28.0, 12.0, 22.0, 18.0, 7.0, 7.0, 16.0, 8.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3837890625, -1.337005615234375, -1.29022216796875, -1.243438720703125, -1.1966552734375, -1.149871826171875, -1.10308837890625, -1.056304931640625, -1.009521484375, -0.962738037109375, -0.91595458984375, -0.869171142578125, -0.8223876953125, -0.775604248046875, -0.72882080078125, -0.682037353515625, -0.63525390625, -0.588470458984375, -0.54168701171875, -0.494903564453125, -0.4481201171875, -0.401336669921875, -0.35455322265625, -0.307769775390625, -0.260986328125, -0.214202880859375, -0.16741943359375, -0.120635986328125, -0.0738525390625, -0.027069091796875, 0.01971435546875, 0.066497802734375, 0.11328125, 0.160064697265625, 0.20684814453125, 0.253631591796875, 0.3004150390625, 0.347198486328125, 0.39398193359375, 0.440765380859375, 0.487548828125, 0.534332275390625, 0.58111572265625, 0.627899169921875, 0.6746826171875, 0.721466064453125, 0.76824951171875, 0.815032958984375, 0.86181640625, 0.908599853515625, 0.95538330078125, 1.002166748046875, 1.0489501953125, 1.095733642578125, 1.14251708984375, 1.189300537109375, 1.236083984375, 1.282867431640625, 1.32965087890625, 1.376434326171875, 1.4232177734375, 1.470001220703125, 1.51678466796875, 1.563568115234375, 1.6103515625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 9.0, 10.0, 17.0, 14.0, 21.0, 28.0, 43.0, 67.0, 102.0, 125.0, 196.0, 311.0, 429.0, 610.0, 1034.0, 1450.0, 2194.0, 3584.0, 5501.0, 8884.0, 14653.0, 24087.0, 41929.0, 78803.0, 175503.0, 1442104.0, 136533.0, 66270.0, 36669.0, 21320.0, 12706.0, 7775.0, 4820.0, 3168.0, 2084.0, 1300.0, 900.0, 583.0, 387.0, 310.0, 190.0, 124.0, 77.0, 85.0, 44.0, 27.0, 21.0, 14.0, 6.0, 9.0, 4.0, 5.0, 3.0, 1.0, 4.0], "bins": [-0.10760498046875, -0.10447406768798828, -0.10134315490722656, -0.09821224212646484, -0.09508132934570312, -0.0919504165649414, -0.08881950378417969, -0.08568859100341797, -0.08255767822265625, -0.07942676544189453, -0.07629585266113281, -0.0731649398803711, -0.07003402709960938, -0.06690311431884766, -0.06377220153808594, -0.06064128875732422, -0.0575103759765625, -0.05437946319580078, -0.05124855041503906, -0.048117637634277344, -0.044986724853515625, -0.041855812072753906, -0.03872489929199219, -0.03559398651123047, -0.03246307373046875, -0.02933216094970703, -0.026201248168945312, -0.023070335388183594, -0.019939422607421875, -0.016808509826660156, -0.013677597045898438, -0.010546684265136719, -0.007415771484375, -0.004284858703613281, -0.0011539459228515625, 0.0019769668579101562, 0.005107879638671875, 0.008238792419433594, 0.011369705200195312, 0.014500617980957031, 0.01763153076171875, 0.02076244354248047, 0.023893356323242188, 0.027024269104003906, 0.030155181884765625, 0.033286094665527344, 0.03641700744628906, 0.03954792022705078, 0.0426788330078125, 0.04580974578857422, 0.04894065856933594, 0.052071571350097656, 0.055202484130859375, 0.058333396911621094, 0.06146430969238281, 0.06459522247314453, 0.06772613525390625, 0.07085704803466797, 0.07398796081542969, 0.0771188735961914, 0.08024978637695312, 0.08338069915771484, 0.08651161193847656, 0.08964252471923828, 0.0927734375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 6.0, 3.0, 2.0, 5.0, 4.0, 5.0, 13.0, 16.0, 25.0, 28.0, 33.0, 79.0, 95.0, 151.0, 156.0, 134.0, 82.0, 59.0, 31.0, 19.0, 15.0, 9.0, 6.0, 8.0, 2.0, 5.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3365020751953125e-05, -2.2738240659236908e-05, -2.211146056652069e-05, -2.1484680473804474e-05, -2.0857900381088257e-05, -2.023112028837204e-05, -1.9604340195655823e-05, -1.8977560102939606e-05, -1.835078001022339e-05, -1.772399991750717e-05, -1.7097219824790955e-05, -1.6470439732074738e-05, -1.584365963935852e-05, -1.5216879546642303e-05, -1.4590099453926086e-05, -1.396331936120987e-05, -1.3336539268493652e-05, -1.2709759175777435e-05, -1.2082979083061218e-05, -1.1456198990345001e-05, -1.0829418897628784e-05, -1.0202638804912567e-05, -9.57585871219635e-06, -8.949078619480133e-06, -8.322298526763916e-06, -7.695518434047699e-06, -7.068738341331482e-06, -6.441958248615265e-06, -5.815178155899048e-06, -5.188398063182831e-06, -4.561617970466614e-06, -3.934837877750397e-06, -3.3080577850341797e-06, -2.6812776923179626e-06, -2.0544975996017456e-06, -1.4277175068855286e-06, -8.009374141693115e-07, -1.7415732145309448e-07, 4.5262277126312256e-07, 1.0794028639793396e-06, 1.7061829566955566e-06, 2.3329630494117737e-06, 2.9597431421279907e-06, 3.5865232348442078e-06, 4.213303327560425e-06, 4.840083420276642e-06, 5.466863512992859e-06, 6.093643605709076e-06, 6.720423698425293e-06, 7.34720379114151e-06, 7.973983883857727e-06, 8.600763976573944e-06, 9.227544069290161e-06, 9.854324162006378e-06, 1.0481104254722595e-05, 1.1107884347438812e-05, 1.173466444015503e-05, 1.2361444532871246e-05, 1.2988224625587463e-05, 1.361500471830368e-05, 1.4241784811019897e-05, 1.4868564903736115e-05, 1.549534499645233e-05, 1.612212508916855e-05, 1.6748905181884766e-05]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 4.0, 11.0, 14.0, 15.0, 29.0, 35.0, 34.0, 42.0, 64.0, 110.0, 339.0, 1311.0, 8454.0, 83577.0, 829750.0, 112184.0, 10238.0, 1604.0, 329.0, 119.0, 61.0, 65.0, 38.0, 16.0, 22.0, 13.0, 9.0, 14.0, 8.0, 5.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025916099548339844, -0.0002497546374797821, -0.00024034827947616577, -0.00023094192147254944, -0.0002215355634689331, -0.00021212920546531677, -0.00020272284746170044, -0.0001933164894580841, -0.00018391013145446777, -0.00017450377345085144, -0.0001650974154472351, -0.00015569105744361877, -0.00014628469944000244, -0.0001368783414363861, -0.00012747198343276978, -0.00011806562542915344, -0.00010865926742553711, -9.925290942192078e-05, -8.984655141830444e-05, -8.044019341468811e-05, -7.103383541107178e-05, -6.162747740745544e-05, -5.222111940383911e-05, -4.281476140022278e-05, -3.3408403396606445e-05, -2.4002045392990112e-05, -1.459568738937378e-05, -5.189329385757446e-06, 4.217028617858887e-06, 1.362338662147522e-05, 2.3029744625091553e-05, 3.2436102628707886e-05, 4.184246063232422e-05, 5.124881863594055e-05, 6.0655176639556885e-05, 7.006153464317322e-05, 7.946789264678955e-05, 8.887425065040588e-05, 9.828060865402222e-05, 0.00010768696665763855, 0.00011709332466125488, 0.00012649968266487122, 0.00013590604066848755, 0.00014531239867210388, 0.00015471875667572021, 0.00016412511467933655, 0.00017353147268295288, 0.00018293783068656921, 0.00019234418869018555, 0.00020175054669380188, 0.0002111569046974182, 0.00022056326270103455, 0.00022996962070465088, 0.0002393759787082672, 0.00024878233671188354, 0.0002581886947154999, 0.0002675950527191162, 0.00027700141072273254, 0.0002864077687263489, 0.0002958141267299652, 0.00030522048473358154, 0.0003146268427371979, 0.0003240332007408142, 0.00033343955874443054, 0.0003428459167480469]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 12.0, 37.0, 71.0, 222.0, 413.0, 150.0, 61.0, 17.0, 16.0, 10.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.274767606053501e-05, -8.079318649834022e-05, -7.883869693614542e-05, -7.688420009799302e-05, -7.492971053579822e-05, -7.297522097360343e-05, -7.102072413545102e-05, -6.906623457325622e-05, -6.711174501106143e-05, -6.515725544886664e-05, -6.320276588667184e-05, -6.124826904851943e-05, -5.929377948632464e-05, -5.7339289924129844e-05, -5.538479672395624e-05, -5.343030352378264e-05, -5.1475813961587846e-05, -4.952132439939305e-05, -4.756683119921945e-05, -4.561233799904585e-05, -4.3657848436851054e-05, -4.170335887465626e-05, -3.974886567448266e-05, -3.779437247430906e-05, -3.583988291211426e-05, -3.388539334991947e-05, -3.193090014974587e-05, -2.997640876856167e-05, -2.802191738737747e-05, -2.6067426006193273e-05, -2.4112934625009075e-05, -2.2158443243824877e-05, -2.020395186264068e-05, -1.824946048145648e-05, -1.6294969100272283e-05, -1.4340477719088085e-05, -1.2385986337903887e-05, -1.0431494956719689e-05, -8.477003575535491e-06, -6.522512194351293e-06, -4.568020813167095e-06, -2.6135294319828972e-06, -6.590380507986993e-07, 1.2954533303854987e-06, 3.2499447115696967e-06, 5.204436092753895e-06, 7.158927473938093e-06, 9.11341885512229e-06, 1.1067910236306489e-05, 1.3022401617490686e-05, 1.4976892998674884e-05, 1.6931384379859082e-05, 1.888587576104328e-05, 2.084036714222748e-05, 2.2794858523411676e-05, 2.4749349904595874e-05, 2.6703841285780072e-05, 2.865833266696427e-05, 3.061282404814847e-05, 3.256731724832207e-05, 3.4521806810516864e-05, 3.647629637271166e-05, 3.843078957288526e-05, 4.038528277305886e-05, 4.2339772335253656e-05]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 4.0, 7.0, 5.0, 5.0, 13.0, 10.0, 12.0, 10.0, 18.0, 17.0, 31.0, 18.0, 33.0, 27.0, 34.0, 22.0, 53.0, 26.0, 37.0, 50.0, 46.0, 43.0, 41.0, 42.0, 44.0, 37.0, 27.0, 32.0, 34.0, 33.0, 25.0, 28.0, 20.0, 23.0, 16.0, 21.0, 8.0, 15.0, 8.0, 9.0, 2.0, 7.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-7.3909759521484375e-06, -7.183291018009186e-06, -6.975606083869934e-06, -6.767921149730682e-06, -6.560236215591431e-06, -6.352551281452179e-06, -6.144866347312927e-06, -5.9371814131736755e-06, -5.729496479034424e-06, -5.521811544895172e-06, -5.31412661075592e-06, -5.106441676616669e-06, -4.898756742477417e-06, -4.691071808338165e-06, -4.4833868741989136e-06, -4.275701940059662e-06, -4.06801700592041e-06, -3.8603320717811584e-06, -3.6526471376419067e-06, -3.444962203502655e-06, -3.2372772693634033e-06, -3.0295923352241516e-06, -2.8219074010849e-06, -2.614222466945648e-06, -2.4065375328063965e-06, -2.1988525986671448e-06, -1.991167664527893e-06, -1.7834827303886414e-06, -1.5757977962493896e-06, -1.368112862110138e-06, -1.1604279279708862e-06, -9.527429938316345e-07, -7.450580596923828e-07, -5.373731255531311e-07, -3.296881914138794e-07, -1.2200325727462769e-07, 8.568167686462402e-08, 2.9336661100387573e-07, 5.010515451431274e-07, 7.087364792823792e-07, 9.164214134216309e-07, 1.1241063475608826e-06, 1.3317912817001343e-06, 1.539476215839386e-06, 1.7471611499786377e-06, 1.9548460841178894e-06, 2.162531018257141e-06, 2.370215952396393e-06, 2.5779008865356445e-06, 2.7855858206748962e-06, 2.993270754814148e-06, 3.2009556889533997e-06, 3.4086406230926514e-06, 3.616325557231903e-06, 3.824010491371155e-06, 4.0316954255104065e-06, 4.239380359649658e-06, 4.44706529378891e-06, 4.654750227928162e-06, 4.862435162067413e-06, 5.070120096206665e-06, 5.277805030345917e-06, 5.4854899644851685e-06, 5.69317489862442e-06, 5.900859832763672e-06]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 5.0, 5.0, 10.0, 3.0, 6.0, 20.0, 13.0, 18.0, 23.0, 17.0, 35.0, 43.0, 40.0, 38.0, 39.0, 30.0, 45.0, 48.0, 48.0, 46.0, 36.0, 44.0, 32.0, 28.0, 49.0, 26.0, 36.0, 32.0, 29.0, 22.0, 16.0, 13.0, 17.0, 16.0, 14.0, 13.0, 11.0, 4.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.728515625, -1.66839599609375, -1.6082763671875, -1.54815673828125, -1.488037109375, -1.42791748046875, -1.3677978515625, -1.30767822265625, -1.24755859375, -1.18743896484375, -1.1273193359375, -1.06719970703125, -1.007080078125, -0.94696044921875, -0.8868408203125, -0.82672119140625, -0.7666015625, -0.70648193359375, -0.6463623046875, -0.58624267578125, -0.526123046875, -0.46600341796875, -0.4058837890625, -0.34576416015625, -0.28564453125, -0.22552490234375, -0.1654052734375, -0.10528564453125, -0.045166015625, 0.01495361328125, 0.0750732421875, 0.13519287109375, 0.1953125, 0.25543212890625, 0.3155517578125, 0.37567138671875, 0.435791015625, 0.49591064453125, 0.5560302734375, 0.61614990234375, 0.67626953125, 0.73638916015625, 0.7965087890625, 0.85662841796875, 0.916748046875, 0.97686767578125, 1.0369873046875, 1.09710693359375, 1.1572265625, 1.21734619140625, 1.2774658203125, 1.33758544921875, 1.397705078125, 1.45782470703125, 1.5179443359375, 1.57806396484375, 1.63818359375, 1.69830322265625, 1.7584228515625, 1.81854248046875, 1.878662109375, 1.93878173828125, 1.9989013671875, 2.05902099609375, 2.119140625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 8.0, 14.0, 11.0, 20.0, 33.0, 42.0, 38.0, 58.0, 93.0, 128.0, 147.0, 261.0, 388.0, 586.0, 1051.0, 1833.0, 3484.0, 7271.0, 16545.0, 40769.0, 113750.0, 435579.0, 283182.0, 85408.0, 31613.0, 13360.0, 5905.0, 2968.0, 1556.0, 865.0, 511.0, 320.0, 207.0, 163.0, 109.0, 74.0, 52.0, 36.0, 28.0, 27.0, 9.0, 14.0, 4.0, 7.0, 6.0, 0.0, 6.0, 9.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-2.7734375, -2.6864013671875, -2.599365234375, -2.5123291015625, -2.42529296875, -2.3382568359375, -2.251220703125, -2.1641845703125, -2.0771484375, -1.9901123046875, -1.903076171875, -1.8160400390625, -1.72900390625, -1.6419677734375, -1.554931640625, -1.4678955078125, -1.380859375, -1.2938232421875, -1.206787109375, -1.1197509765625, -1.03271484375, -0.9456787109375, -0.858642578125, -0.7716064453125, -0.6845703125, -0.5975341796875, -0.510498046875, -0.4234619140625, -0.33642578125, -0.2493896484375, -0.162353515625, -0.0753173828125, 0.01171875, 0.0987548828125, 0.185791015625, 0.2728271484375, 0.35986328125, 0.4468994140625, 0.533935546875, 0.6209716796875, 0.7080078125, 0.7950439453125, 0.882080078125, 0.9691162109375, 1.05615234375, 1.1431884765625, 1.230224609375, 1.3172607421875, 1.404296875, 1.4913330078125, 1.578369140625, 1.6654052734375, 1.75244140625, 1.8394775390625, 1.926513671875, 2.0135498046875, 2.1005859375, 2.1876220703125, 2.274658203125, 2.3616943359375, 2.44873046875, 2.5357666015625, 2.622802734375, 2.7098388671875, 2.796875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 10.0, 7.0, 3.0, 13.0, 11.0, 18.0, 21.0, 21.0, 28.0, 28.0, 17.0, 30.0, 42.0, 33.0, 41.0, 62.0, 63.0, 131.0, 1905.0, 92.0, 51.0, 52.0, 33.0, 40.0, 39.0, 28.0, 34.0, 33.0, 23.0, 24.0, 20.0, 19.0, 11.0, 9.0, 16.0, 11.0, 6.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.73046875, -6.50897216796875, -6.2874755859375, -6.06597900390625, -5.844482421875, -5.62298583984375, -5.4014892578125, -5.17999267578125, -4.95849609375, -4.73699951171875, -4.5155029296875, -4.29400634765625, -4.072509765625, -3.85101318359375, -3.6295166015625, -3.40802001953125, -3.1865234375, -2.96502685546875, -2.7435302734375, -2.52203369140625, -2.300537109375, -2.07904052734375, -1.8575439453125, -1.63604736328125, -1.41455078125, -1.19305419921875, -0.9715576171875, -0.75006103515625, -0.528564453125, -0.30706787109375, -0.0855712890625, 0.13592529296875, 0.357421875, 0.57891845703125, 0.8004150390625, 1.02191162109375, 1.243408203125, 1.46490478515625, 1.6864013671875, 1.90789794921875, 2.12939453125, 2.35089111328125, 2.5723876953125, 2.79388427734375, 3.015380859375, 3.23687744140625, 3.4583740234375, 3.67987060546875, 3.9013671875, 4.12286376953125, 4.3443603515625, 4.56585693359375, 4.787353515625, 5.00885009765625, 5.2303466796875, 5.45184326171875, 5.67333984375, 5.89483642578125, 6.1163330078125, 6.33782958984375, 6.559326171875, 6.78082275390625, 7.0023193359375, 7.22381591796875, 7.4453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 12.0, 11.0, 11.0, 12.0, 22.0, 19.0, 27.0, 21.0, 39.0, 45.0, 49.0, 74.0, 101.0, 147.0, 306.0, 890.0, 7849.0, 2971310.0, 160385.0, 3085.0, 558.0, 233.0, 113.0, 83.0, 59.0, 47.0, 21.0, 34.0, 28.0, 23.0, 19.0, 9.0, 13.0, 2.0, 8.0, 11.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-18.34375, -17.801513671875, -17.25927734375, -16.717041015625, -16.1748046875, -15.632568359375, -15.09033203125, -14.548095703125, -14.005859375, -13.463623046875, -12.92138671875, -12.379150390625, -11.8369140625, -11.294677734375, -10.75244140625, -10.210205078125, -9.66796875, -9.125732421875, -8.58349609375, -8.041259765625, -7.4990234375, -6.956787109375, -6.41455078125, -5.872314453125, -5.330078125, -4.787841796875, -4.24560546875, -3.703369140625, -3.1611328125, -2.618896484375, -2.07666015625, -1.534423828125, -0.9921875, -0.449951171875, 0.09228515625, 0.634521484375, 1.1767578125, 1.718994140625, 2.26123046875, 2.803466796875, 3.345703125, 3.887939453125, 4.43017578125, 4.972412109375, 5.5146484375, 6.056884765625, 6.59912109375, 7.141357421875, 7.68359375, 8.225830078125, 8.76806640625, 9.310302734375, 9.8525390625, 10.394775390625, 10.93701171875, 11.479248046875, 12.021484375, 12.563720703125, 13.10595703125, 13.648193359375, 14.1904296875, 14.732666015625, 15.27490234375, 15.817138671875, 16.359375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 8.0, 23.0, 47.0, 93.0, 256.0, 267.0, 184.0, 82.0, 34.0, 10.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.424560546875, -20.915821075439453, -20.407081604003906, -19.898340225219727, -19.38960075378418, -18.880861282348633, -18.372121810913086, -17.86338233947754, -17.35464096069336, -16.845901489257812, -16.337162017822266, -15.828421592712402, -15.319681167602539, -14.810941696166992, -14.302202224731445, -13.793462753295898, -13.284723281860352, -12.775983810424805, -12.267243385314941, -11.758503913879395, -11.249763488769531, -10.741024017333984, -10.232284545898438, -9.72354507446289, -9.214804649353027, -8.70606517791748, -8.197324752807617, -7.68858528137207, -7.179845333099365, -6.67110538482666, -6.162365913391113, -5.653625965118408, -5.144887924194336, -4.636147975921631, -4.127408027648926, -3.618668556213379, -3.109928607940674, -2.6011886596679688, -2.0924489498138428, -1.5837092399597168, -1.0749692916870117, -0.5662294626235962, -0.057489633560180664, 0.45125019550323486, 0.9599900245666504, 1.4687299728393555, 1.9774696826934814, 2.4862093925476074, 2.9949493408203125, 3.5036892890930176, 4.012429237365723, 4.5211687088012695, 5.029908657073975, 5.53864860534668, 6.047388076782227, 6.556128025054932, 7.064867973327637, 7.573607921600342, 8.082347869873047, 8.591087341308594, 9.09982681274414, 9.608567237854004, 10.11730670928955, 10.626047134399414, 11.134786605834961]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 3.0, 3.0, 5.0, 6.0, 13.0, 14.0, 16.0, 15.0, 13.0, 35.0, 16.0, 27.0, 30.0, 32.0, 39.0, 37.0, 31.0, 34.0, 45.0, 45.0, 52.0, 41.0, 51.0, 44.0, 35.0, 29.0, 34.0, 30.0, 26.0, 29.0, 30.0, 23.0, 20.0, 23.0, 15.0, 6.0, 14.0, 4.0, 5.0, 8.0, 5.0, 0.0, 8.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.145593643188477, -22.424327850341797, -21.70306396484375, -20.98179817199707, -20.26053237915039, -19.539268493652344, -18.818002700805664, -18.096736907958984, -17.375473022460938, -16.654207229614258, -15.932943344116211, -15.211677551269531, -14.490412712097168, -13.769147872924805, -13.047882080078125, -12.326617240905762, -11.605352401733398, -10.884087562561035, -10.162822723388672, -9.441556930541992, -8.720292091369629, -7.999027252197266, -7.277761936187744, -6.556496620178223, -5.835231781005859, -5.113966941833496, -4.392701625823975, -3.6714365482330322, -2.95017147064209, -2.2289063930511475, -1.507641315460205, -0.7863759994506836, -0.06511306762695312, 0.6561520099639893, 1.3774170875549316, 2.098682165145874, 2.8199472427368164, 3.541212320327759, 4.262477397918701, 4.983742713928223, 5.705007553100586, 6.426272392272949, 7.147537708282471, 7.868803024291992, 8.590067863464355, 9.311332702636719, 10.032598495483398, 10.753863334655762, 11.475128173828125, 12.196393013000488, 12.917657852172852, 13.638923645019531, 14.360188484191895, 15.081453323364258, 15.802719116210938, 16.523983001708984, 17.245248794555664, 17.966514587402344, 18.68777847290039, 19.40904426574707, 20.13031005859375, 20.851573944091797, 21.572839736938477, 22.294105529785156, 23.015369415283203]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 6.0, 5.0, 19.0, 13.0, 20.0, 18.0, 21.0, 35.0, 48.0, 42.0, 31.0, 34.0, 35.0, 42.0, 47.0, 49.0, 53.0, 36.0, 44.0, 33.0, 31.0, 40.0, 34.0, 33.0, 34.0, 19.0, 22.0, 26.0, 12.0, 17.0, 16.0, 14.0, 9.0, 12.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.775390625, -1.713653564453125, -1.65191650390625, -1.590179443359375, -1.5284423828125, -1.466705322265625, -1.40496826171875, -1.343231201171875, -1.281494140625, -1.219757080078125, -1.15802001953125, -1.096282958984375, -1.0345458984375, -0.972808837890625, -0.91107177734375, -0.849334716796875, -0.78759765625, -0.725860595703125, -0.66412353515625, -0.602386474609375, -0.5406494140625, -0.478912353515625, -0.41717529296875, -0.355438232421875, -0.293701171875, -0.231964111328125, -0.17022705078125, -0.108489990234375, -0.0467529296875, 0.014984130859375, 0.07672119140625, 0.138458251953125, 0.2001953125, 0.261932373046875, 0.32366943359375, 0.385406494140625, 0.4471435546875, 0.508880615234375, 0.57061767578125, 0.632354736328125, 0.694091796875, 0.755828857421875, 0.81756591796875, 0.879302978515625, 0.9410400390625, 1.002777099609375, 1.06451416015625, 1.126251220703125, 1.18798828125, 1.249725341796875, 1.31146240234375, 1.373199462890625, 1.4349365234375, 1.496673583984375, 1.55841064453125, 1.620147705078125, 1.681884765625, 1.743621826171875, 1.80535888671875, 1.867095947265625, 1.9288330078125, 1.990570068359375, 2.05230712890625, 2.114044189453125, 2.17578125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 9.0, 4.0, 9.0, 7.0, 20.0, 22.0, 21.0, 22.0, 43.0, 51.0, 76.0, 100.0, 145.0, 270.0, 582.0, 1543.0, 6477.0, 52731.0, 1423769.0, 2617382.0, 77888.0, 9202.0, 2039.0, 765.0, 379.0, 225.0, 127.0, 97.0, 69.0, 47.0, 45.0, 26.0, 20.0, 14.0, 10.0, 8.0, 10.0, 7.0, 9.0, 4.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.546875, -10.1424560546875, -9.738037109375, -9.3336181640625, -8.92919921875, -8.5247802734375, -8.120361328125, -7.7159423828125, -7.3115234375, -6.9071044921875, -6.502685546875, -6.0982666015625, -5.69384765625, -5.2894287109375, -4.885009765625, -4.4805908203125, -4.076171875, -3.6717529296875, -3.267333984375, -2.8629150390625, -2.45849609375, -2.0540771484375, -1.649658203125, -1.2452392578125, -0.8408203125, -0.4364013671875, -0.031982421875, 0.3724365234375, 0.77685546875, 1.1812744140625, 1.585693359375, 1.9901123046875, 2.39453125, 2.7989501953125, 3.203369140625, 3.6077880859375, 4.01220703125, 4.4166259765625, 4.821044921875, 5.2254638671875, 5.6298828125, 6.0343017578125, 6.438720703125, 6.8431396484375, 7.24755859375, 7.6519775390625, 8.056396484375, 8.4608154296875, 8.865234375, 9.2696533203125, 9.674072265625, 10.0784912109375, 10.48291015625, 10.8873291015625, 11.291748046875, 11.6961669921875, 12.1005859375, 12.5050048828125, 12.909423828125, 13.3138427734375, 13.71826171875, 14.1226806640625, 14.527099609375, 14.9315185546875, 15.3359375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 6.0, 8.0, 10.0, 19.0, 14.0, 18.0, 30.0, 61.0, 57.0, 90.0, 118.0, 153.0, 260.0, 358.0, 428.0, 577.0, 498.0, 370.0, 263.0, 228.0, 163.0, 99.0, 77.0, 46.0, 29.0, 32.0, 15.0, 13.0, 7.0, 10.0, 2.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.69140625, -7.481689453125, -7.27197265625, -7.062255859375, -6.8525390625, -6.642822265625, -6.43310546875, -6.223388671875, -6.013671875, -5.803955078125, -5.59423828125, -5.384521484375, -5.1748046875, -4.965087890625, -4.75537109375, -4.545654296875, -4.3359375, -4.126220703125, -3.91650390625, -3.706787109375, -3.4970703125, -3.287353515625, -3.07763671875, -2.867919921875, -2.658203125, -2.448486328125, -2.23876953125, -2.029052734375, -1.8193359375, -1.609619140625, -1.39990234375, -1.190185546875, -0.98046875, -0.770751953125, -0.56103515625, -0.351318359375, -0.1416015625, 0.068115234375, 0.27783203125, 0.487548828125, 0.697265625, 0.906982421875, 1.11669921875, 1.326416015625, 1.5361328125, 1.745849609375, 1.95556640625, 2.165283203125, 2.375, 2.584716796875, 2.79443359375, 3.004150390625, 3.2138671875, 3.423583984375, 3.63330078125, 3.843017578125, 4.052734375, 4.262451171875, 4.47216796875, 4.681884765625, 4.8916015625, 5.101318359375, 5.31103515625, 5.520751953125, 5.73046875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 8.0, 11.0, 15.0, 19.0, 43.0, 57.0, 102.0, 190.0, 375.0, 748.0, 2028.0, 7562.0, 42924.0, 403805.0, 3217033.0, 459556.0, 47656.0, 8277.0, 2242.0, 818.0, 366.0, 197.0, 85.0, 64.0, 37.0, 22.0, 15.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2734375, -14.7730712890625, -14.272705078125, -13.7723388671875, -13.27197265625, -12.7716064453125, -12.271240234375, -11.7708740234375, -11.2705078125, -10.7701416015625, -10.269775390625, -9.7694091796875, -9.26904296875, -8.7686767578125, -8.268310546875, -7.7679443359375, -7.267578125, -6.7672119140625, -6.266845703125, -5.7664794921875, -5.26611328125, -4.7657470703125, -4.265380859375, -3.7650146484375, -3.2646484375, -2.7642822265625, -2.263916015625, -1.7635498046875, -1.26318359375, -0.7628173828125, -0.262451171875, 0.2379150390625, 0.73828125, 1.2386474609375, 1.739013671875, 2.2393798828125, 2.73974609375, 3.2401123046875, 3.740478515625, 4.2408447265625, 4.7412109375, 5.2415771484375, 5.741943359375, 6.2423095703125, 6.74267578125, 7.2430419921875, 7.743408203125, 8.2437744140625, 8.744140625, 9.2445068359375, 9.744873046875, 10.2452392578125, 10.74560546875, 11.2459716796875, 11.746337890625, 12.2467041015625, 12.7470703125, 13.2474365234375, 13.747802734375, 14.2481689453125, 14.74853515625, 15.2489013671875, 15.749267578125, 16.2496337890625, 16.75]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 8.0, 7.0, 14.0, 37.0, 90.0, 149.0, 190.0, 190.0, 154.0, 107.0, 36.0, 18.0, 11.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.54336929321289, -17.617279052734375, -15.691190719604492, -13.765101432800293, -11.839012145996094, -9.912922859191895, -7.986833572387695, -6.060744285583496, -4.134654998779297, -2.2085657119750977, -0.28247642517089844, 1.6436128616333008, 3.5697021484375, 5.495791435241699, 7.421880722045898, 9.347970008850098, 11.274059295654297, 13.200148582458496, 15.126237869262695, 17.052326202392578, 18.978416442871094, 20.90450668334961, 22.830595016479492, 24.756683349609375, 26.68277359008789, 28.608863830566406, 30.53495216369629, 32.46104049682617, 34.38713073730469, 36.3132209777832, 38.23931121826172, 40.16539764404297, 42.09149169921875, 44.017581939697266, 45.94367218017578, 47.86975860595703, 49.79584884643555, 51.72193908691406, 53.64802551269531, 55.57411575317383, 57.500205993652344, 59.42629623413086, 61.352386474609375, 63.278472900390625, 65.20455932617188, 67.13065338134766, 69.0567398071289, 70.98283386230469, 72.90892028808594, 74.83500671386719, 76.76110076904297, 78.68718719482422, 80.61328125, 82.53936767578125, 84.4654541015625, 86.39154815673828, 88.31763458251953, 90.24372100830078, 92.16981506347656, 94.09590148925781, 96.02198791503906, 97.94808197021484, 99.8741683959961, 101.80026245117188, 103.72634887695312]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 9.0, 7.0, 4.0, 8.0, 7.0, 8.0, 8.0, 9.0, 9.0, 21.0, 19.0, 18.0, 29.0, 23.0, 23.0, 26.0, 36.0, 28.0, 31.0, 30.0, 33.0, 44.0, 43.0, 42.0, 32.0, 36.0, 39.0, 44.0, 32.0, 32.0, 20.0, 26.0, 18.0, 27.0, 31.0, 29.0, 13.0, 16.0, 11.0, 15.0, 14.0, 11.0, 13.0, 10.0, 3.0, 3.0, 5.0, 7.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-19.619171142578125, -19.022232055664062, -18.42529296875, -17.82835578918457, -17.231416702270508, -16.634477615356445, -16.037540435791016, -15.440601348876953, -14.84366226196289, -14.246723175048828, -13.649785041809082, -13.052846908569336, -12.455907821655273, -11.858968734741211, -11.262030601501465, -10.665092468261719, -10.068153381347656, -9.471214294433594, -8.874276161193848, -8.277338027954102, -7.680398941040039, -7.083460330963135, -6.4865217208862305, -5.889583110809326, -5.292644500732422, -4.695705890655518, -4.098767280578613, -3.501828670501709, -2.9048900604248047, -2.3079514503479004, -1.711012840270996, -1.1140742301940918, -0.5171356201171875, 0.0798029899597168, 0.6767416000366211, 1.2736802101135254, 1.8706188201904297, 2.467557430267334, 3.0644960403442383, 3.6614346504211426, 4.258373260498047, 4.855311870574951, 5.4522504806518555, 6.04918909072876, 6.646127700805664, 7.243066310882568, 7.840004920959473, 8.436943054199219, 9.033882141113281, 9.630821228027344, 10.22775936126709, 10.824697494506836, 11.421636581420898, 12.018575668334961, 12.615513801574707, 13.212451934814453, 13.809391021728516, 14.406330108642578, 15.003268241882324, 15.60020637512207, 16.197145462036133, 16.794084548950195, 17.391021728515625, 17.987960815429688, 18.58489990234375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 5.0, 4.0, 4.0, 2.0, 7.0, 3.0, 7.0, 6.0, 7.0, 19.0, 26.0, 17.0, 34.0, 32.0, 38.0, 37.0, 30.0, 29.0, 46.0, 27.0, 48.0, 37.0, 55.0, 52.0, 39.0, 33.0, 35.0, 34.0, 35.0, 36.0, 30.0, 28.0, 27.0, 26.0, 22.0, 10.0, 12.0, 13.0, 11.0, 9.0, 11.0, 3.0, 2.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5830078125, -1.5199432373046875, -1.456878662109375, -1.3938140869140625, -1.33074951171875, -1.2676849365234375, -1.204620361328125, -1.1415557861328125, -1.0784912109375, -1.0154266357421875, -0.952362060546875, -0.8892974853515625, -0.82623291015625, -0.7631683349609375, -0.700103759765625, -0.6370391845703125, -0.573974609375, -0.5109100341796875, -0.447845458984375, -0.3847808837890625, -0.32171630859375, -0.2586517333984375, -0.195587158203125, -0.1325225830078125, -0.0694580078125, -0.0063934326171875, 0.056671142578125, 0.1197357177734375, 0.18280029296875, 0.2458648681640625, 0.308929443359375, 0.3719940185546875, 0.43505859375, 0.4981231689453125, 0.561187744140625, 0.6242523193359375, 0.68731689453125, 0.7503814697265625, 0.813446044921875, 0.8765106201171875, 0.9395751953125, 1.0026397705078125, 1.065704345703125, 1.1287689208984375, 1.19183349609375, 1.2548980712890625, 1.317962646484375, 1.3810272216796875, 1.444091796875, 1.5071563720703125, 1.570220947265625, 1.6332855224609375, 1.69635009765625, 1.7594146728515625, 1.822479248046875, 1.8855438232421875, 1.9486083984375, 2.0116729736328125, 2.074737548828125, 2.1378021240234375, 2.20086669921875, 2.2639312744140625, 2.326995849609375, 2.3900604248046875, 2.453125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 7.0, 4.0, 18.0, 19.0, 30.0, 41.0, 57.0, 87.0, 140.0, 230.0, 321.0, 531.0, 792.0, 1089.0, 1664.0, 2733.0, 4272.0, 6930.0, 11733.0, 19175.0, 32883.0, 58061.0, 107647.0, 310413.0, 254140.0, 101189.0, 55670.0, 31588.0, 17995.0, 10716.0, 6556.0, 3989.0, 2647.0, 1658.0, 1104.0, 761.0, 515.0, 334.0, 229.0, 184.0, 114.0, 82.0, 68.0, 48.0, 35.0, 17.0, 11.0, 9.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.220703125, -0.2140064239501953, -0.20730972290039062, -0.20061302185058594, -0.19391632080078125, -0.18721961975097656, -0.18052291870117188, -0.1738262176513672, -0.1671295166015625, -0.1604328155517578, -0.15373611450195312, -0.14703941345214844, -0.14034271240234375, -0.13364601135253906, -0.12694931030273438, -0.12025260925292969, -0.113555908203125, -0.10685920715332031, -0.10016250610351562, -0.09346580505371094, -0.08676910400390625, -0.08007240295410156, -0.07337570190429688, -0.06667900085449219, -0.0599822998046875, -0.05328559875488281, -0.046588897705078125, -0.03989219665527344, -0.03319549560546875, -0.026498794555664062, -0.019802093505859375, -0.013105392456054688, -0.00640869140625, 0.0002880096435546875, 0.006984710693359375, 0.013681411743164062, 0.02037811279296875, 0.027074813842773438, 0.033771514892578125, 0.04046821594238281, 0.0471649169921875, 0.05386161804199219, 0.060558319091796875, 0.06725502014160156, 0.07395172119140625, 0.08064842224121094, 0.08734512329101562, 0.09404182434082031, 0.100738525390625, 0.10743522644042969, 0.11413192749023438, 0.12082862854003906, 0.12752532958984375, 0.13422203063964844, 0.14091873168945312, 0.1476154327392578, 0.1543121337890625, 0.1610088348388672, 0.16770553588867188, 0.17440223693847656, 0.18109893798828125, 0.18779563903808594, 0.19449234008789062, 0.2011890411376953, 0.2078857421875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 3.0, 5.0, 1.0, 4.0, 7.0, 10.0, 12.0, 8.0, 11.0, 9.0, 19.0, 18.0, 25.0, 28.0, 27.0, 25.0, 25.0, 35.0, 27.0, 35.0, 37.0, 35.0, 34.0, 31.0, 1057.0, 48.0, 43.0, 37.0, 43.0, 35.0, 28.0, 19.0, 23.0, 24.0, 37.0, 21.0, 23.0, 21.0, 17.0, 9.0, 8.0, 11.0, 12.0, 5.0, 7.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.46484375, -1.4234771728515625, -1.382110595703125, -1.3407440185546875, -1.29937744140625, -1.2580108642578125, -1.216644287109375, -1.1752777099609375, -1.1339111328125, -1.0925445556640625, -1.051177978515625, -1.0098114013671875, -0.96844482421875, -0.9270782470703125, -0.885711669921875, -0.8443450927734375, -0.802978515625, -0.7616119384765625, -0.720245361328125, -0.6788787841796875, -0.63751220703125, -0.5961456298828125, -0.554779052734375, -0.5134124755859375, -0.4720458984375, -0.4306793212890625, -0.389312744140625, -0.3479461669921875, -0.30657958984375, -0.2652130126953125, -0.223846435546875, -0.1824798583984375, -0.14111328125, -0.0997467041015625, -0.058380126953125, -0.0170135498046875, 0.02435302734375, 0.0657196044921875, 0.107086181640625, 0.1484527587890625, 0.1898193359375, 0.2311859130859375, 0.272552490234375, 0.3139190673828125, 0.35528564453125, 0.3966522216796875, 0.438018798828125, 0.4793853759765625, 0.520751953125, 0.5621185302734375, 0.603485107421875, 0.6448516845703125, 0.68621826171875, 0.7275848388671875, 0.768951416015625, 0.8103179931640625, 0.8516845703125, 0.8930511474609375, 0.934417724609375, 0.9757843017578125, 1.01715087890625, 1.0585174560546875, 1.099884033203125, 1.1412506103515625, 1.1826171875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 6.0, 7.0, 10.0, 16.0, 32.0, 35.0, 46.0, 73.0, 85.0, 140.0, 212.0, 300.0, 430.0, 611.0, 878.0, 1226.0, 1893.0, 2773.0, 4044.0, 6309.0, 9508.0, 14841.0, 23750.0, 39027.0, 68751.0, 136420.0, 1409927.0, 173667.0, 80877.0, 45430.0, 27112.0, 16836.0, 10566.0, 6905.0, 4585.0, 3032.0, 2019.0, 1447.0, 1039.0, 667.0, 475.0, 333.0, 227.0, 162.0, 132.0, 84.0, 61.0, 35.0, 34.0, 20.0, 16.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.08404541015625, -0.08120918273925781, -0.07837295532226562, -0.07553672790527344, -0.07270050048828125, -0.06986427307128906, -0.06702804565429688, -0.06419181823730469, -0.0613555908203125, -0.05851936340332031, -0.055683135986328125, -0.05284690856933594, -0.05001068115234375, -0.04717445373535156, -0.044338226318359375, -0.04150199890136719, -0.038665771484375, -0.03582954406738281, -0.032993316650390625, -0.030157089233398438, -0.02732086181640625, -0.024484634399414062, -0.021648406982421875, -0.018812179565429688, -0.0159759521484375, -0.013139724731445312, -0.010303497314453125, -0.0074672698974609375, -0.00463104248046875, -0.0017948150634765625, 0.001041412353515625, 0.0038776397705078125, 0.0067138671875, 0.009550094604492188, 0.012386322021484375, 0.015222549438476562, 0.01805877685546875, 0.020895004272460938, 0.023731231689453125, 0.026567459106445312, 0.0294036865234375, 0.03223991394042969, 0.035076141357421875, 0.03791236877441406, 0.04074859619140625, 0.04358482360839844, 0.046421051025390625, 0.04925727844238281, 0.052093505859375, 0.05492973327636719, 0.057765960693359375, 0.06060218811035156, 0.06343841552734375, 0.06627464294433594, 0.06911087036132812, 0.07194709777832031, 0.0747833251953125, 0.07761955261230469, 0.08045578002929688, 0.08329200744628906, 0.08612823486328125, 0.08896446228027344, 0.09180068969726562, 0.09463691711425781, 0.09747314453125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 4.0, 3.0, 9.0, 8.0, 9.0, 20.0, 17.0, 8.0, 28.0, 27.0, 20.0, 40.0, 46.0, 58.0, 85.0, 91.0, 85.0, 85.0, 69.0, 50.0, 29.0, 30.0, 22.0, 31.0, 12.0, 10.0, 19.0, 19.0, 9.0, 6.0, 7.0, 9.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.245737075805664e-05, -1.2081116437911987e-05, -1.1704862117767334e-05, -1.132860779762268e-05, -1.0952353477478027e-05, -1.0576099157333374e-05, -1.019984483718872e-05, -9.823590517044067e-06, -9.447336196899414e-06, -9.07108187675476e-06, -8.694827556610107e-06, -8.318573236465454e-06, -7.9423189163208e-06, -7.5660645961761475e-06, -7.189810276031494e-06, -6.813555955886841e-06, -6.4373016357421875e-06, -6.061047315597534e-06, -5.684792995452881e-06, -5.3085386753082275e-06, -4.932284355163574e-06, -4.556030035018921e-06, -4.179775714874268e-06, -3.8035213947296143e-06, -3.427267074584961e-06, -3.0510127544403076e-06, -2.6747584342956543e-06, -2.298504114151001e-06, -1.9222497940063477e-06, -1.5459954738616943e-06, -1.169741153717041e-06, -7.934868335723877e-07, -4.172325134277344e-07, -4.0978193283081055e-08, 3.3527612686157227e-07, 7.115304470062256e-07, 1.087784767150879e-06, 1.4640390872955322e-06, 1.8402934074401855e-06, 2.216547727584839e-06, 2.592802047729492e-06, 2.9690563678741455e-06, 3.345310688018799e-06, 3.721565008163452e-06, 4.0978193283081055e-06, 4.474073648452759e-06, 4.850327968597412e-06, 5.2265822887420654e-06, 5.602836608886719e-06, 5.979090929031372e-06, 6.355345249176025e-06, 6.731599569320679e-06, 7.107853889465332e-06, 7.484108209609985e-06, 7.860362529754639e-06, 8.236616849899292e-06, 8.612871170043945e-06, 8.989125490188599e-06, 9.365379810333252e-06, 9.741634130477905e-06, 1.0117888450622559e-05, 1.0494142770767212e-05, 1.0870397090911865e-05, 1.1246651411056519e-05, 1.1622905731201172e-05]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 6.0, 5.0, 9.0, 6.0, 14.0, 15.0, 25.0, 21.0, 36.0, 61.0, 69.0, 137.0, 244.0, 597.0, 1476.0, 3880.0, 11195.0, 35815.0, 130439.0, 606651.0, 187855.0, 47188.0, 14666.0, 4810.0, 1812.0, 732.0, 305.0, 163.0, 105.0, 42.0, 41.0, 38.0, 21.0, 16.0, 15.0, 8.0, 8.0, 2.0, 3.0, 3.0, 6.0, 1.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0001615285873413086, -0.00015641935169696808, -0.00015131011605262756, -0.00014620088040828705, -0.00014109164476394653, -0.00013598240911960602, -0.0001308731734752655, -0.000125763937830925, -0.00012065470218658447, -0.00011554546654224396, -0.00011043623089790344, -0.00010532699525356293, -0.00010021775960922241, -9.51085239648819e-05, -8.999928832054138e-05, -8.489005267620087e-05, -7.978081703186035e-05, -7.467158138751984e-05, -6.956234574317932e-05, -6.44531100988388e-05, -5.934387445449829e-05, -5.4234638810157776e-05, -4.912540316581726e-05, -4.4016167521476746e-05, -3.890693187713623e-05, -3.3797696232795715e-05, -2.86884605884552e-05, -2.3579224944114685e-05, -1.846998929977417e-05, -1.3360753655433655e-05, -8.25151801109314e-06, -3.1422823667526245e-06, 1.9669532775878906e-06, 7.076188921928406e-06, 1.2185424566268921e-05, 1.7294660210609436e-05, 2.240389585494995e-05, 2.7513131499290466e-05, 3.262236714363098e-05, 3.7731602787971497e-05, 4.284083843231201e-05, 4.795007407665253e-05, 5.305930972099304e-05, 5.816854536533356e-05, 6.327778100967407e-05, 6.838701665401459e-05, 7.34962522983551e-05, 7.860548794269562e-05, 8.371472358703613e-05, 8.882395923137665e-05, 9.393319487571716e-05, 9.904243052005768e-05, 0.0001041516661643982, 0.00010926090180873871, 0.00011437013745307922, 0.00011947937309741974, 0.00012458860874176025, 0.00012969784438610077, 0.00013480708003044128, 0.0001399163156747818, 0.00014502555131912231, 0.00015013478696346283, 0.00015524402260780334, 0.00016035325825214386, 0.00016546249389648438]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 6.0, 2.0, 11.0, 27.0, 22.0, 34.0, 58.0, 132.0, 226.0, 213.0, 116.0, 56.0, 36.0, 20.0, 13.0, 12.0, 12.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.787805558706168e-05, -1.6760122889536433e-05, -1.5642190192011185e-05, -1.4524258403980639e-05, -1.3406326615950093e-05, -1.2288393918424845e-05, -1.1170461220899597e-05, -1.005252943286905e-05, -8.934596735343803e-06, -7.816664037818555e-06, -6.698732249788009e-06, -5.580799552262761e-06, -4.462867309484864e-06, -3.3449350667069666e-06, -2.2270023691817187e-06, -1.1090705811511725e-06, 8.862116374075413e-09, 1.1267944728388102e-06, 2.244726829303545e-06, 3.3626592994551174e-06, 4.4805915422330145e-06, 5.5985237850109115e-06, 6.7164564825361595e-06, 7.834388270566706e-06, 8.952320968091954e-06, 1.0070253665617201e-05, 1.1188185453647748e-05, 1.2306118151172996e-05, 1.3424050848698243e-05, 1.454198263672879e-05, 1.565991624374874e-05, 1.6777847122284584e-05, 1.7895781638799235e-05, 1.9013714336324483e-05, 2.013164703384973e-05, 2.124957973137498e-05, 2.2367510609910823e-05, 2.348544330743607e-05, 2.460337600496132e-05, 2.5721306883497164e-05, 2.683923958102241e-05, 2.795717227854766e-05, 2.9075104976072907e-05, 3.0193037673598155e-05, 3.13109703711234e-05, 3.2428899430669844e-05, 3.35468357661739e-05, 3.466476482572034e-05, 3.5782701161224395e-05, 3.690063385874964e-05, 3.801856655627489e-05, 3.913649925380014e-05, 4.025443195132539e-05, 4.137236101087183e-05, 4.249029734637588e-05, 4.3608226405922323e-05, 4.472615910344757e-05, 4.584409180097282e-05, 4.696202449849807e-05, 4.8079957196023315e-05, 4.919788989354856e-05, 5.031582259107381e-05, 5.143375165062025e-05, 5.25516843481455e-05, 5.366961704567075e-05]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 9.0, 15.0, 15.0, 8.0, 23.0, 15.0, 14.0, 17.0, 21.0, 24.0, 34.0, 37.0, 28.0, 34.0, 31.0, 39.0, 30.0, 35.0, 39.0, 45.0, 44.0, 33.0, 39.0, 33.0, 37.0, 41.0, 36.0, 23.0, 22.0, 26.0, 36.0, 18.0, 15.0, 4.0, 14.0, 11.0, 10.0, 5.0, 3.0, 6.0, 4.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.304813385009766e-06, -5.123205482959747e-06, -4.941597580909729e-06, -4.759989678859711e-06, -4.578381776809692e-06, -4.396773874759674e-06, -4.215165972709656e-06, -4.0335580706596375e-06, -3.851950168609619e-06, -3.670342266559601e-06, -3.4887343645095825e-06, -3.307126462459564e-06, -3.125518560409546e-06, -2.9439106583595276e-06, -2.7623027563095093e-06, -2.580694854259491e-06, -2.3990869522094727e-06, -2.2174790501594543e-06, -2.035871148109436e-06, -1.8542632460594177e-06, -1.6726553440093994e-06, -1.491047441959381e-06, -1.3094395399093628e-06, -1.1278316378593445e-06, -9.462237358093262e-07, -7.646158337593079e-07, -5.830079317092896e-07, -4.0140002965927124e-07, -2.1979212760925293e-07, -3.818422555923462e-08, 1.434236764907837e-07, 3.25031578540802e-07, 5.066394805908203e-07, 6.882473826408386e-07, 8.698552846908569e-07, 1.0514631867408752e-06, 1.2330710887908936e-06, 1.4146789908409119e-06, 1.5962868928909302e-06, 1.7778947949409485e-06, 1.959502696990967e-06, 2.141110599040985e-06, 2.3227185010910034e-06, 2.5043264031410217e-06, 2.68593430519104e-06, 2.8675422072410583e-06, 3.0491501092910767e-06, 3.230758011341095e-06, 3.4123659133911133e-06, 3.5939738154411316e-06, 3.77558171749115e-06, 3.957189619541168e-06, 4.1387975215911865e-06, 4.320405423641205e-06, 4.502013325691223e-06, 4.6836212277412415e-06, 4.86522912979126e-06, 5.046837031841278e-06, 5.228444933891296e-06, 5.410052835941315e-06, 5.591660737991333e-06, 5.773268640041351e-06, 5.95487654209137e-06, 6.136484444141388e-06, 6.318092346191406e-06]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 5.0, 4.0, 4.0, 2.0, 7.0, 3.0, 7.0, 6.0, 7.0, 19.0, 26.0, 17.0, 34.0, 32.0, 38.0, 37.0, 30.0, 29.0, 46.0, 27.0, 48.0, 37.0, 55.0, 52.0, 39.0, 33.0, 35.0, 34.0, 35.0, 36.0, 30.0, 28.0, 27.0, 26.0, 22.0, 10.0, 12.0, 13.0, 11.0, 9.0, 11.0, 3.0, 2.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5830078125, -1.5199432373046875, -1.456878662109375, -1.3938140869140625, -1.33074951171875, -1.2676849365234375, -1.204620361328125, -1.1415557861328125, -1.0784912109375, -1.0154266357421875, -0.952362060546875, -0.8892974853515625, -0.82623291015625, -0.7631683349609375, -0.700103759765625, -0.6370391845703125, -0.573974609375, -0.5109100341796875, -0.447845458984375, -0.3847808837890625, -0.32171630859375, -0.2586517333984375, -0.195587158203125, -0.1325225830078125, -0.0694580078125, -0.0063934326171875, 0.056671142578125, 0.1197357177734375, 0.18280029296875, 0.2458648681640625, 0.308929443359375, 0.3719940185546875, 0.43505859375, 0.4981231689453125, 0.561187744140625, 0.6242523193359375, 0.68731689453125, 0.7503814697265625, 0.813446044921875, 0.8765106201171875, 0.9395751953125, 1.0026397705078125, 1.065704345703125, 1.1287689208984375, 1.19183349609375, 1.2548980712890625, 1.317962646484375, 1.3810272216796875, 1.444091796875, 1.5071563720703125, 1.570220947265625, 1.6332855224609375, 1.69635009765625, 1.7594146728515625, 1.822479248046875, 1.8855438232421875, 1.9486083984375, 2.0116729736328125, 2.074737548828125, 2.1378021240234375, 2.20086669921875, 2.2639312744140625, 2.326995849609375, 2.3900604248046875, 2.453125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 7.0, 13.0, 15.0, 25.0, 43.0, 65.0, 106.0, 193.0, 373.0, 843.0, 2088.0, 5587.0, 19486.0, 115592.0, 743174.0, 129921.0, 21367.0, 5842.0, 2041.0, 848.0, 376.0, 213.0, 110.0, 66.0, 48.0, 33.0, 24.0, 18.0, 6.0, 7.0, 5.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.89984130859375, -3.7098388671875, -3.51983642578125, -3.329833984375, -3.13983154296875, -2.9498291015625, -2.75982666015625, -2.56982421875, -2.37982177734375, -2.1898193359375, -1.99981689453125, -1.809814453125, -1.61981201171875, -1.4298095703125, -1.23980712890625, -1.0498046875, -0.85980224609375, -0.6697998046875, -0.47979736328125, -0.289794921875, -0.09979248046875, 0.0902099609375, 0.28021240234375, 0.47021484375, 0.66021728515625, 0.8502197265625, 1.04022216796875, 1.230224609375, 1.42022705078125, 1.6102294921875, 1.80023193359375, 1.990234375, 2.18023681640625, 2.3702392578125, 2.56024169921875, 2.750244140625, 2.94024658203125, 3.1302490234375, 3.32025146484375, 3.51025390625, 3.70025634765625, 3.8902587890625, 4.08026123046875, 4.270263671875, 4.46026611328125, 4.6502685546875, 4.84027099609375, 5.0302734375, 5.22027587890625, 5.4102783203125, 5.60028076171875, 5.790283203125, 5.98028564453125, 6.1702880859375, 6.36029052734375, 6.55029296875, 6.74029541015625, 6.9302978515625, 7.12030029296875, 7.310302734375, 7.50030517578125, 7.6903076171875, 7.88031005859375, 8.0703125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 11.0, 9.0, 10.0, 8.0, 17.0, 20.0, 17.0, 27.0, 35.0, 28.0, 44.0, 36.0, 39.0, 52.0, 58.0, 77.0, 119.0, 1835.0, 103.0, 62.0, 63.0, 47.0, 35.0, 35.0, 37.0, 34.0, 33.0, 30.0, 22.0, 23.0, 18.0, 13.0, 6.0, 14.0, 2.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28125, -7.04254150390625, -6.8038330078125, -6.56512451171875, -6.326416015625, -6.08770751953125, -5.8489990234375, -5.61029052734375, -5.37158203125, -5.13287353515625, -4.8941650390625, -4.65545654296875, -4.416748046875, -4.17803955078125, -3.9393310546875, -3.70062255859375, -3.4619140625, -3.22320556640625, -2.9844970703125, -2.74578857421875, -2.507080078125, -2.26837158203125, -2.0296630859375, -1.79095458984375, -1.55224609375, -1.31353759765625, -1.0748291015625, -0.83612060546875, -0.597412109375, -0.35870361328125, -0.1199951171875, 0.11871337890625, 0.357421875, 0.59613037109375, 0.8348388671875, 1.07354736328125, 1.312255859375, 1.55096435546875, 1.7896728515625, 2.02838134765625, 2.26708984375, 2.50579833984375, 2.7445068359375, 2.98321533203125, 3.221923828125, 3.46063232421875, 3.6993408203125, 3.93804931640625, 4.1767578125, 4.41546630859375, 4.6541748046875, 4.89288330078125, 5.131591796875, 5.37030029296875, 5.6090087890625, 5.84771728515625, 6.08642578125, 6.32513427734375, 6.5638427734375, 6.80255126953125, 7.041259765625, 7.27996826171875, 7.5186767578125, 7.75738525390625, 7.99609375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 1.0, 10.0, 12.0, 14.0, 18.0, 25.0, 12.0, 29.0, 39.0, 48.0, 55.0, 85.0, 146.0, 350.0, 1023.0, 5282.0, 67635.0, 3001173.0, 62899.0, 4977.0, 1002.0, 336.0, 167.0, 97.0, 59.0, 34.0, 39.0, 24.0, 17.0, 24.0, 9.0, 13.0, 9.0, 11.0, 7.0, 8.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7265625, -15.2569580078125, -14.787353515625, -14.3177490234375, -13.84814453125, -13.3785400390625, -12.908935546875, -12.4393310546875, -11.9697265625, -11.5001220703125, -11.030517578125, -10.5609130859375, -10.09130859375, -9.6217041015625, -9.152099609375, -8.6824951171875, -8.212890625, -7.7432861328125, -7.273681640625, -6.8040771484375, -6.33447265625, -5.8648681640625, -5.395263671875, -4.9256591796875, -4.4560546875, -3.9864501953125, -3.516845703125, -3.0472412109375, -2.57763671875, -2.1080322265625, -1.638427734375, -1.1688232421875, -0.69921875, -0.2296142578125, 0.239990234375, 0.7095947265625, 1.17919921875, 1.6488037109375, 2.118408203125, 2.5880126953125, 3.0576171875, 3.5272216796875, 3.996826171875, 4.4664306640625, 4.93603515625, 5.4056396484375, 5.875244140625, 6.3448486328125, 6.814453125, 7.2840576171875, 7.753662109375, 8.2232666015625, 8.69287109375, 9.1624755859375, 9.632080078125, 10.1016845703125, 10.5712890625, 11.0408935546875, 11.510498046875, 11.9801025390625, 12.44970703125, 12.9193115234375, 13.388916015625, 13.8585205078125, 14.328125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 6.0, 25.0, 57.0, 119.0, 216.0, 241.0, 174.0, 93.0, 51.0, 15.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.216583251953125, -18.485082626342773, -17.753582000732422, -17.02208137512207, -16.29058074951172, -15.559080123901367, -14.827579498291016, -14.096078872680664, -13.364578247070312, -12.633077621459961, -11.90157699584961, -11.170076370239258, -10.438575744628906, -9.707075119018555, -8.975574493408203, -8.244073867797852, -7.5125732421875, -6.781072616577148, -6.049571990966797, -5.318071365356445, -4.586570739746094, -3.855070114135742, -3.1235694885253906, -2.392068862915039, -1.6605682373046875, -0.9290676116943359, -0.19756698608398438, 0.5339336395263672, 1.2654342651367188, 1.9969348907470703, 2.728435516357422, 3.4599361419677734, 4.191434860229492, 4.922935485839844, 5.654436111450195, 6.385936737060547, 7.117437362670898, 7.84893798828125, 8.580438613891602, 9.311939239501953, 10.043439865112305, 10.774940490722656, 11.506441116333008, 12.23794174194336, 12.969442367553711, 13.700942993164062, 14.432443618774414, 15.163944244384766, 15.895444869995117, 16.62694549560547, 17.35844612121582, 18.089946746826172, 18.821447372436523, 19.552947998046875, 20.284448623657227, 21.015949249267578, 21.74744987487793, 22.47895050048828, 23.210451126098633, 23.941951751708984, 24.673452377319336, 25.404953002929688, 26.13645362854004, 26.86795425415039, 27.599454879760742]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 5.0, 7.0, 8.0, 3.0, 13.0, 10.0, 22.0, 21.0, 27.0, 26.0, 25.0, 42.0, 28.0, 40.0, 30.0, 23.0, 39.0, 44.0, 47.0, 35.0, 32.0, 33.0, 32.0, 31.0, 37.0, 43.0, 41.0, 35.0, 21.0, 27.0, 13.0, 24.0, 27.0, 16.0, 15.0, 16.0, 13.0, 12.0, 14.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.442291259765625, -21.69692611694336, -20.951560974121094, -20.206195831298828, -19.46082878112793, -18.715463638305664, -17.9700984954834, -17.224733352661133, -16.479368209838867, -15.734003067016602, -14.98863697052002, -14.243271827697754, -13.497906684875488, -12.752540588378906, -12.00717544555664, -11.261810302734375, -10.516444206237793, -9.771079063415527, -9.025712966918945, -8.28034782409668, -7.534982681274414, -6.78961706161499, -6.044251441955566, -5.298886299133301, -4.553520679473877, -3.8081552982330322, -3.0627899169921875, -2.3174242973327637, -1.572058916091919, -0.8266935348510742, -0.08132791519165039, 0.6640372276306152, 1.409402847290039, 2.154768228530884, 2.9001336097717285, 3.6454992294311523, 4.390864372253418, 5.136229991912842, 5.881595611572266, 6.626960754394531, 7.372326374053955, 8.117691993713379, 8.863057136535645, 9.608423233032227, 10.353788375854492, 11.099153518676758, 11.844518661499023, 12.589883804321289, 13.335249900817871, 14.080615043640137, 14.825981140136719, 15.571346282958984, 16.31671142578125, 17.062076568603516, 17.80744171142578, 18.552806854248047, 19.298173904418945, 20.04353904724121, 20.788904190063477, 21.534271240234375, 22.27963638305664, 23.025001525878906, 23.770366668701172, 24.515731811523438, 25.261096954345703]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 9.0, 2.0, 2.0, 6.0, 3.0, 7.0, 7.0, 2.0, 7.0, 15.0, 24.0, 26.0, 27.0, 26.0, 44.0, 32.0, 34.0, 36.0, 30.0, 31.0, 42.0, 43.0, 41.0, 45.0, 45.0, 45.0, 35.0, 24.0, 42.0, 33.0, 31.0, 31.0, 24.0, 26.0, 22.0, 23.0, 11.0, 10.0, 12.0, 10.0, 12.0, 10.0, 3.0, 2.0, 1.0, 6.0, 3.0, 5.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5498046875, -1.4867401123046875, -1.423675537109375, -1.3606109619140625, -1.29754638671875, -1.2344818115234375, -1.171417236328125, -1.1083526611328125, -1.0452880859375, -0.9822235107421875, -0.919158935546875, -0.8560943603515625, -0.79302978515625, -0.7299652099609375, -0.666900634765625, -0.6038360595703125, -0.540771484375, -0.4777069091796875, -0.414642333984375, -0.3515777587890625, -0.28851318359375, -0.2254486083984375, -0.162384033203125, -0.0993194580078125, -0.0362548828125, 0.0268096923828125, 0.089874267578125, 0.1529388427734375, 0.21600341796875, 0.2790679931640625, 0.342132568359375, 0.4051971435546875, 0.46826171875, 0.5313262939453125, 0.594390869140625, 0.6574554443359375, 0.72052001953125, 0.7835845947265625, 0.846649169921875, 0.9097137451171875, 0.9727783203125, 1.0358428955078125, 1.098907470703125, 1.1619720458984375, 1.22503662109375, 1.2881011962890625, 1.351165771484375, 1.4142303466796875, 1.477294921875, 1.5403594970703125, 1.603424072265625, 1.6664886474609375, 1.72955322265625, 1.7926177978515625, 1.855682373046875, 1.9187469482421875, 1.9818115234375, 2.0448760986328125, 2.107940673828125, 2.1710052490234375, 2.23406982421875, 2.2971343994140625, 2.360198974609375, 2.4232635498046875, 2.486328125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 10.0, 9.0, 11.0, 13.0, 18.0, 32.0, 33.0, 59.0, 65.0, 98.0, 148.0, 275.0, 560.0, 1393.0, 5093.0, 25415.0, 254784.0, 3473569.0, 388915.0, 33710.0, 6484.0, 1921.0, 723.0, 335.0, 176.0, 117.0, 80.0, 53.0, 50.0, 31.0, 12.0, 20.0, 19.0, 13.0, 12.0, 2.0, 3.0, 8.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.734375, -9.3936767578125, -9.052978515625, -8.7122802734375, -8.37158203125, -8.0308837890625, -7.690185546875, -7.3494873046875, -7.0087890625, -6.6680908203125, -6.327392578125, -5.9866943359375, -5.64599609375, -5.3052978515625, -4.964599609375, -4.6239013671875, -4.283203125, -3.9425048828125, -3.601806640625, -3.2611083984375, -2.92041015625, -2.5797119140625, -2.239013671875, -1.8983154296875, -1.5576171875, -1.2169189453125, -0.876220703125, -0.5355224609375, -0.19482421875, 0.1458740234375, 0.486572265625, 0.8272705078125, 1.16796875, 1.5086669921875, 1.849365234375, 2.1900634765625, 2.53076171875, 2.8714599609375, 3.212158203125, 3.5528564453125, 3.8935546875, 4.2342529296875, 4.574951171875, 4.9156494140625, 5.25634765625, 5.5970458984375, 5.937744140625, 6.2784423828125, 6.619140625, 6.9598388671875, 7.300537109375, 7.6412353515625, 7.98193359375, 8.3226318359375, 8.663330078125, 9.0040283203125, 9.3447265625, 9.6854248046875, 10.026123046875, 10.3668212890625, 10.70751953125, 11.0482177734375, 11.388916015625, 11.7296142578125, 12.0703125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 6.0, 8.0, 19.0, 17.0, 33.0, 52.0, 73.0, 103.0, 176.0, 269.0, 410.0, 650.0, 714.0, 558.0, 345.0, 224.0, 145.0, 88.0, 67.0, 33.0, 32.0, 14.0, 13.0, 9.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.2216796875, -7.958984375, -7.6962890625, -7.43359375, -7.1708984375, -6.908203125, -6.6455078125, -6.3828125, -6.1201171875, -5.857421875, -5.5947265625, -5.33203125, -5.0693359375, -4.806640625, -4.5439453125, -4.28125, -4.0185546875, -3.755859375, -3.4931640625, -3.23046875, -2.9677734375, -2.705078125, -2.4423828125, -2.1796875, -1.9169921875, -1.654296875, -1.3916015625, -1.12890625, -0.8662109375, -0.603515625, -0.3408203125, -0.078125, 0.1845703125, 0.447265625, 0.7099609375, 0.97265625, 1.2353515625, 1.498046875, 1.7607421875, 2.0234375, 2.2861328125, 2.548828125, 2.8115234375, 3.07421875, 3.3369140625, 3.599609375, 3.8623046875, 4.125, 4.3876953125, 4.650390625, 4.9130859375, 5.17578125, 5.4384765625, 5.701171875, 5.9638671875, 6.2265625, 6.4892578125, 6.751953125, 7.0146484375, 7.27734375, 7.5400390625, 7.802734375, 8.0654296875, 8.328125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 11.0, 25.0, 43.0, 79.0, 140.0, 269.0, 549.0, 1643.0, 8242.0, 104188.0, 3473102.0, 578379.0, 22840.0, 3078.0, 910.0, 380.0, 166.0, 103.0, 52.0, 26.0, 22.0, 12.0, 8.0, 9.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-31.59375, -30.836669921875, -30.07958984375, -29.322509765625, -28.5654296875, -27.808349609375, -27.05126953125, -26.294189453125, -25.537109375, -24.780029296875, -24.02294921875, -23.265869140625, -22.5087890625, -21.751708984375, -20.99462890625, -20.237548828125, -19.48046875, -18.723388671875, -17.96630859375, -17.209228515625, -16.4521484375, -15.695068359375, -14.93798828125, -14.180908203125, -13.423828125, -12.666748046875, -11.90966796875, -11.152587890625, -10.3955078125, -9.638427734375, -8.88134765625, -8.124267578125, -7.3671875, -6.610107421875, -5.85302734375, -5.095947265625, -4.3388671875, -3.581787109375, -2.82470703125, -2.067626953125, -1.310546875, -0.553466796875, 0.20361328125, 0.960693359375, 1.7177734375, 2.474853515625, 3.23193359375, 3.989013671875, 4.74609375, 5.503173828125, 6.26025390625, 7.017333984375, 7.7744140625, 8.531494140625, 9.28857421875, 10.045654296875, 10.802734375, 11.559814453125, 12.31689453125, 13.073974609375, 13.8310546875, 14.588134765625, 15.34521484375, 16.102294921875, 16.859375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 9.0, 20.0, 35.0, 50.0, 74.0, 116.0, 136.0, 153.0, 135.0, 109.0, 79.0, 35.0, 32.0, 13.0, 9.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.623903274536133, -15.174619674682617, -13.725335121154785, -12.276050567626953, -10.826766967773438, -9.377483367919922, -7.92819881439209, -6.478914260864258, -5.029630661010742, -3.5803465843200684, -2.1310625076293945, -0.6817784309387207, 0.7675056457519531, 2.216789722442627, 3.666073799133301, 5.115358352661133, 6.564641952514648, 8.013925552368164, 9.463210105895996, 10.912494659423828, 12.361778259277344, 13.81106185913086, 15.260346412658691, 16.709630966186523, 18.15891456604004, 19.608198165893555, 21.057483673095703, 22.50676727294922, 23.956050872802734, 25.40533447265625, 26.854618072509766, 28.303903579711914, 29.753189086914062, 31.202472686767578, 32.651756286621094, 34.10103988647461, 35.550323486328125, 36.999610900878906, 38.44889450073242, 39.89817810058594, 41.34746170043945, 42.79674530029297, 44.246028900146484, 45.6953125, 47.14459991455078, 48.5938835144043, 50.04316711425781, 51.49245071411133, 52.941734313964844, 54.39101791381836, 55.840301513671875, 57.28958511352539, 58.738868713378906, 60.18815612792969, 61.6374397277832, 63.08672332763672, 64.5360107421875, 65.98529815673828, 67.43457794189453, 68.88386535644531, 70.33314514160156, 71.78243255615234, 73.2317123413086, 74.68099975585938, 76.13027954101562]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 5.0, 14.0, 10.0, 10.0, 10.0, 16.0, 10.0, 16.0, 25.0, 27.0, 37.0, 27.0, 37.0, 31.0, 41.0, 38.0, 41.0, 40.0, 52.0, 45.0, 30.0, 44.0, 41.0, 44.0, 30.0, 40.0, 29.0, 30.0, 30.0, 25.0, 12.0, 22.0, 21.0, 14.0, 13.0, 7.0, 16.0, 7.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.290603637695312, -22.636634826660156, -21.982666015625, -21.328697204589844, -20.674728393554688, -20.02075958251953, -19.366790771484375, -18.71282196044922, -18.058853149414062, -17.404884338378906, -16.75091552734375, -16.096946716308594, -15.442977905273438, -14.789009094238281, -14.135039329528809, -13.481070518493652, -12.82710075378418, -12.173131942749023, -11.519163131713867, -10.865194320678711, -10.211225509643555, -9.557256698608398, -8.903286933898926, -8.24931812286377, -7.595349311828613, -6.941380500793457, -6.287411689758301, -5.633442401885986, -4.97947359085083, -4.325504779815674, -3.6715357303619385, -3.017566680908203, -2.363597869873047, -1.709628939628601, -1.0556600093841553, -0.4016910791397095, 0.25227785110473633, 0.9062466621398926, 1.560215711593628, 2.2141847610473633, 2.8681535720825195, 3.522122383117676, 4.176091194152832, 4.8300604820251465, 5.484029293060303, 6.137998104095459, 6.791967391967773, 7.44593620300293, 8.099905014038086, 8.753873825073242, 9.407842636108398, 10.061811447143555, 10.715780258178711, 11.369749069213867, 12.02371883392334, 12.677687644958496, 13.331656455993652, 13.985625267028809, 14.639594078063965, 15.293562889099121, 15.947532653808594, 16.60150146484375, 17.255470275878906, 17.909439086914062, 18.56340789794922]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 4.0, 5.0, 6.0, 3.0, 9.0, 6.0, 14.0, 13.0, 9.0, 22.0, 20.0, 27.0, 32.0, 32.0, 27.0, 38.0, 40.0, 41.0, 37.0, 48.0, 57.0, 43.0, 35.0, 37.0, 38.0, 36.0, 41.0, 36.0, 31.0, 21.0, 34.0, 27.0, 18.0, 19.0, 13.0, 15.0, 14.0, 10.0, 8.0, 3.0, 8.0, 12.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6591796875, -1.5928192138671875, -1.526458740234375, -1.4600982666015625, -1.39373779296875, -1.3273773193359375, -1.261016845703125, -1.1946563720703125, -1.1282958984375, -1.0619354248046875, -0.995574951171875, -0.9292144775390625, -0.86285400390625, -0.7964935302734375, -0.730133056640625, -0.6637725830078125, -0.597412109375, -0.5310516357421875, -0.464691162109375, -0.3983306884765625, -0.33197021484375, -0.2656097412109375, -0.199249267578125, -0.1328887939453125, -0.0665283203125, -0.0001678466796875, 0.066192626953125, 0.1325531005859375, 0.19891357421875, 0.2652740478515625, 0.331634521484375, 0.3979949951171875, 0.46435546875, 0.5307159423828125, 0.597076416015625, 0.6634368896484375, 0.72979736328125, 0.7961578369140625, 0.862518310546875, 0.9288787841796875, 0.9952392578125, 1.0615997314453125, 1.127960205078125, 1.1943206787109375, 1.26068115234375, 1.3270416259765625, 1.393402099609375, 1.4597625732421875, 1.526123046875, 1.5924835205078125, 1.658843994140625, 1.7252044677734375, 1.79156494140625, 1.8579254150390625, 1.924285888671875, 1.9906463623046875, 2.0570068359375, 2.1233673095703125, 2.189727783203125, 2.2560882568359375, 2.32244873046875, 2.3888092041015625, 2.455169677734375, 2.5215301513671875, 2.587890625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 7.0, 12.0, 12.0, 18.0, 23.0, 33.0, 41.0, 73.0, 87.0, 138.0, 201.0, 292.0, 417.0, 650.0, 1007.0, 1561.0, 2374.0, 3749.0, 5969.0, 9694.0, 15832.0, 26641.0, 46284.0, 85978.0, 186014.0, 353279.0, 141344.0, 69830.0, 38482.0, 22407.0, 13343.0, 8229.0, 5178.0, 3223.0, 2112.0, 1354.0, 846.0, 571.0, 416.0, 279.0, 186.0, 121.0, 78.0, 61.0, 36.0, 27.0, 16.0, 9.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.2352294921875, -0.22857284545898438, -0.22191619873046875, -0.21525955200195312, -0.2086029052734375, -0.20194625854492188, -0.19528961181640625, -0.18863296508789062, -0.181976318359375, -0.17531967163085938, -0.16866302490234375, -0.16200637817382812, -0.1553497314453125, -0.14869308471679688, -0.14203643798828125, -0.13537979125976562, -0.12872314453125, -0.12206649780273438, -0.11540985107421875, -0.10875320434570312, -0.1020965576171875, -0.09543991088867188, -0.08878326416015625, -0.08212661743164062, -0.075469970703125, -0.06881332397460938, -0.06215667724609375, -0.055500030517578125, -0.0488433837890625, -0.042186737060546875, -0.03553009033203125, -0.028873443603515625, -0.022216796875, -0.015560150146484375, -0.00890350341796875, -0.002246856689453125, 0.0044097900390625, 0.011066436767578125, 0.01772308349609375, 0.024379730224609375, 0.031036376953125, 0.037693023681640625, 0.04434967041015625, 0.051006317138671875, 0.0576629638671875, 0.06431961059570312, 0.07097625732421875, 0.07763290405273438, 0.08428955078125, 0.09094619750976562, 0.09760284423828125, 0.10425949096679688, 0.1109161376953125, 0.11757278442382812, 0.12422943115234375, 0.13088607788085938, 0.137542724609375, 0.14419937133789062, 0.15085601806640625, 0.15751266479492188, 0.1641693115234375, 0.17082595825195312, 0.17748260498046875, 0.18413925170898438, 0.1907958984375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 7.0, 7.0, 9.0, 7.0, 8.0, 8.0, 10.0, 13.0, 16.0, 9.0, 20.0, 28.0, 21.0, 37.0, 36.0, 28.0, 40.0, 32.0, 40.0, 38.0, 41.0, 1056.0, 43.0, 44.0, 56.0, 34.0, 42.0, 35.0, 34.0, 28.0, 31.0, 23.0, 22.0, 21.0, 15.0, 11.0, 10.0, 21.0, 10.0, 10.0, 8.0, 7.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5595703125, -1.5107269287109375, -1.461883544921875, -1.4130401611328125, -1.36419677734375, -1.3153533935546875, -1.266510009765625, -1.2176666259765625, -1.1688232421875, -1.1199798583984375, -1.071136474609375, -1.0222930908203125, -0.97344970703125, -0.9246063232421875, -0.875762939453125, -0.8269195556640625, -0.778076171875, -0.7292327880859375, -0.680389404296875, -0.6315460205078125, -0.58270263671875, -0.5338592529296875, -0.485015869140625, -0.4361724853515625, -0.3873291015625, -0.3384857177734375, -0.289642333984375, -0.2407989501953125, -0.19195556640625, -0.1431121826171875, -0.094268798828125, -0.0454254150390625, 0.00341796875, 0.0522613525390625, 0.101104736328125, 0.1499481201171875, 0.19879150390625, 0.2476348876953125, 0.296478271484375, 0.3453216552734375, 0.3941650390625, 0.4430084228515625, 0.491851806640625, 0.5406951904296875, 0.58953857421875, 0.6383819580078125, 0.687225341796875, 0.7360687255859375, 0.784912109375, 0.8337554931640625, 0.882598876953125, 0.9314422607421875, 0.98028564453125, 1.0291290283203125, 1.077972412109375, 1.1268157958984375, 1.1756591796875, 1.2245025634765625, 1.273345947265625, 1.3221893310546875, 1.37103271484375, 1.4198760986328125, 1.468719482421875, 1.5175628662109375, 1.56640625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 7.0, 13.0, 17.0, 22.0, 44.0, 69.0, 82.0, 137.0, 208.0, 258.0, 404.0, 641.0, 955.0, 1406.0, 2067.0, 3081.0, 4838.0, 7283.0, 11706.0, 18659.0, 31442.0, 56150.0, 109408.0, 1362528.0, 256720.0, 98854.0, 51826.0, 29461.0, 17578.0, 10957.0, 6922.0, 4437.0, 2937.0, 2016.0, 1309.0, 847.0, 589.0, 421.0, 278.0, 165.0, 136.0, 84.0, 49.0, 45.0, 22.0, 22.0, 13.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.103759765625, -0.1005105972290039, -0.09726142883300781, -0.09401226043701172, -0.09076309204101562, -0.08751392364501953, -0.08426475524902344, -0.08101558685302734, -0.07776641845703125, -0.07451725006103516, -0.07126808166503906, -0.06801891326904297, -0.06476974487304688, -0.06152057647705078, -0.05827140808105469, -0.055022239685058594, -0.0517730712890625, -0.048523902893066406, -0.04527473449707031, -0.04202556610107422, -0.038776397705078125, -0.03552722930908203, -0.03227806091308594, -0.029028892517089844, -0.02577972412109375, -0.022530555725097656, -0.019281387329101562, -0.01603221893310547, -0.012783050537109375, -0.009533882141113281, -0.0062847137451171875, -0.0030355453491210938, 0.000213623046875, 0.0034627914428710938, 0.0067119598388671875, 0.009961128234863281, 0.013210296630859375, 0.01645946502685547, 0.019708633422851562, 0.022957801818847656, 0.02620697021484375, 0.029456138610839844, 0.03270530700683594, 0.03595447540283203, 0.039203643798828125, 0.04245281219482422, 0.04570198059082031, 0.048951148986816406, 0.0522003173828125, 0.055449485778808594, 0.05869865417480469, 0.06194782257080078, 0.06519699096679688, 0.06844615936279297, 0.07169532775878906, 0.07494449615478516, 0.07819366455078125, 0.08144283294677734, 0.08469200134277344, 0.08794116973876953, 0.09119033813476562, 0.09443950653076172, 0.09768867492675781, 0.1009378433227539, 0.10418701171875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 7.0, 3.0, 12.0, 9.0, 16.0, 7.0, 11.0, 22.0, 16.0, 29.0, 21.0, 38.0, 57.0, 94.0, 146.0, 119.0, 81.0, 62.0, 48.0, 36.0, 30.0, 37.0, 16.0, 13.0, 8.0, 7.0, 9.0, 10.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.5676021575927734e-05, -1.5266239643096924e-05, -1.4856457710266113e-05, -1.4446675777435303e-05, -1.4036893844604492e-05, -1.3627111911773682e-05, -1.3217329978942871e-05, -1.280754804611206e-05, -1.239776611328125e-05, -1.198798418045044e-05, -1.1578202247619629e-05, -1.1168420314788818e-05, -1.0758638381958008e-05, -1.0348856449127197e-05, -9.939074516296387e-06, -9.529292583465576e-06, -9.119510650634766e-06, -8.709728717803955e-06, -8.299946784973145e-06, -7.890164852142334e-06, -7.4803829193115234e-06, -7.070600986480713e-06, -6.660819053649902e-06, -6.251037120819092e-06, -5.841255187988281e-06, -5.431473255157471e-06, -5.02169132232666e-06, -4.61190938949585e-06, -4.202127456665039e-06, -3.7923455238342285e-06, -3.382563591003418e-06, -2.9727816581726074e-06, -2.562999725341797e-06, -2.1532177925109863e-06, -1.7434358596801758e-06, -1.3336539268493652e-06, -9.238719940185547e-07, -5.140900611877441e-07, -1.043081283569336e-07, 3.0547380447387695e-07, 7.152557373046875e-07, 1.125037670135498e-06, 1.5348196029663086e-06, 1.944601535797119e-06, 2.3543834686279297e-06, 2.7641654014587402e-06, 3.1739473342895508e-06, 3.5837292671203613e-06, 3.993511199951172e-06, 4.403293132781982e-06, 4.813075065612793e-06, 5.2228569984436035e-06, 5.632638931274414e-06, 6.042420864105225e-06, 6.452202796936035e-06, 6.861984729766846e-06, 7.271766662597656e-06, 7.681548595428467e-06, 8.091330528259277e-06, 8.501112461090088e-06, 8.910894393920898e-06, 9.320676326751709e-06, 9.73045825958252e-06, 1.014024019241333e-05, 1.055002212524414e-05]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 7.0, 17.0, 13.0, 22.0, 21.0, 28.0, 26.0, 49.0, 67.0, 97.0, 141.0, 400.0, 1404.0, 8119.0, 66594.0, 822529.0, 132516.0, 13216.0, 2136.0, 519.0, 210.0, 109.0, 75.0, 55.0, 40.0, 21.0, 22.0, 23.0, 15.0, 11.0, 4.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00019299983978271484, -0.00018546916544437408, -0.00017793849110603333, -0.00017040781676769257, -0.0001628771424293518, -0.00015534646809101105, -0.0001478157937526703, -0.00014028511941432953, -0.00013275444507598877, -0.000125223770737648, -0.00011769309639930725, -0.00011016242206096649, -0.00010263174772262573, -9.510107338428497e-05, -8.757039904594421e-05, -8.003972470760345e-05, -7.25090503692627e-05, -6.497837603092194e-05, -5.744770169258118e-05, -4.991702735424042e-05, -4.238635301589966e-05, -3.48556786775589e-05, -2.732500433921814e-05, -1.979433000087738e-05, -1.2263655662536621e-05, -4.732981324195862e-06, 2.7976930141448975e-06, 1.0328367352485657e-05, 1.7859041690826416e-05, 2.5389716029167175e-05, 3.2920390367507935e-05, 4.0451064705848694e-05, 4.798173904418945e-05, 5.551241338253021e-05, 6.304308772087097e-05, 7.057376205921173e-05, 7.810443639755249e-05, 8.563511073589325e-05, 9.316578507423401e-05, 0.00010069645941257477, 0.00010822713375091553, 0.00011575780808925629, 0.00012328848242759705, 0.0001308191567659378, 0.00013834983110427856, 0.00014588050544261932, 0.00015341117978096008, 0.00016094185411930084, 0.0001684725284576416, 0.00017600320279598236, 0.00018353387713432312, 0.00019106455147266388, 0.00019859522581100464, 0.0002061259001493454, 0.00021365657448768616, 0.00022118724882602692, 0.00022871792316436768, 0.00023624859750270844, 0.0002437792718410492, 0.00025130994617938995, 0.0002588406205177307, 0.00026637129485607147, 0.00027390196919441223, 0.000281432643532753, 0.00028896331787109375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 5.0, 10.0, 13.0, 28.0, 79.0, 138.0, 261.0, 252.0, 116.0, 47.0, 27.0, 15.0, 8.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.832100214320235e-05, -5.7175857364200056e-05, -5.603071258519776e-05, -5.488556780619547e-05, -5.3740423027193174e-05, -5.259527824819088e-05, -5.145012983120978e-05, -5.0304985052207485e-05, -4.915984027320519e-05, -4.80146954942029e-05, -4.68695507152006e-05, -4.572440593619831e-05, -4.4579261157196015e-05, -4.3434112740214914e-05, -4.228897159919143e-05, -4.1143823182210326e-05, -3.999868204118684e-05, -3.8853537262184545e-05, -3.770839248318225e-05, -3.656324770417996e-05, -3.5418102925177664e-05, -3.427295450819656e-05, -3.3127813367173076e-05, -3.1982664950191975e-05, -3.083752017118968e-05, -2.9692375392187387e-05, -2.8547230613185093e-05, -2.74020858341828e-05, -2.62569392361911e-05, -2.5111794457188807e-05, -2.3966649678186513e-05, -2.2821503080194816e-05, -2.1676358301192522e-05, -2.0531213522190228e-05, -1.9386068743187934e-05, -1.824092396418564e-05, -1.7095777366193943e-05, -1.595063258719165e-05, -1.4805487808189355e-05, -1.3660342119692359e-05, -1.2515197340690065e-05, -1.1370052561687771e-05, -1.0224906873190776e-05, -9.079762094188482e-06, -7.934617315186188e-06, -6.789471626689192e-06, -5.644326847686898e-06, -4.499181159189902e-06, -3.3540363801876083e-06, -2.2088911464379635e-06, -1.063746140061994e-06, 8.13988663139753e-08, 1.2265441000636201e-06, 2.371689333813265e-06, 3.516834112815559e-06, 4.661979801312555e-06, 5.8071245803148486e-06, 6.952269814064493e-06, 8.097415047814138e-06, 9.242559826816432e-06, 1.0387704605818726e-05, 1.1532850294315722e-05, 1.2677995073318016e-05, 1.3823140761815012e-05, 1.4968285540817305e-05]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 6.0, 12.0, 10.0, 16.0, 13.0, 15.0, 16.0, 16.0, 17.0, 22.0, 26.0, 18.0, 29.0, 35.0, 15.0, 43.0, 45.0, 41.0, 32.0, 38.0, 42.0, 20.0, 43.0, 43.0, 49.0, 33.0, 34.0, 35.0, 19.0, 27.0, 24.0, 20.0, 20.0, 13.0, 21.0, 13.0, 13.0, 12.0, 11.0, 10.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.827976226806641e-06, -4.657544195652008e-06, -4.4871121644973755e-06, -4.316680133342743e-06, -4.14624810218811e-06, -3.975816071033478e-06, -3.8053840398788452e-06, -3.6349520087242126e-06, -3.46451997756958e-06, -3.2940879464149475e-06, -3.123655915260315e-06, -2.9532238841056824e-06, -2.78279185295105e-06, -2.6123598217964172e-06, -2.4419277906417847e-06, -2.271495759487152e-06, -2.1010637283325195e-06, -1.930631697177887e-06, -1.7601996660232544e-06, -1.5897676348686218e-06, -1.4193356037139893e-06, -1.2489035725593567e-06, -1.0784715414047241e-06, -9.080395102500916e-07, -7.37607479095459e-07, -5.671754479408264e-07, -3.9674341678619385e-07, -2.2631138563156128e-07, -5.587935447692871e-08, 1.1455267667770386e-07, 2.849847078323364e-07, 4.55416738986969e-07, 6.258487701416016e-07, 7.962808012962341e-07, 9.667128324508667e-07, 1.1371448636054993e-06, 1.3075768947601318e-06, 1.4780089259147644e-06, 1.648440957069397e-06, 1.8188729882240295e-06, 1.989305019378662e-06, 2.1597370505332947e-06, 2.3301690816879272e-06, 2.50060111284256e-06, 2.6710331439971924e-06, 2.841465175151825e-06, 3.0118972063064575e-06, 3.18232923746109e-06, 3.3527612686157227e-06, 3.5231932997703552e-06, 3.693625330924988e-06, 3.86405736207962e-06, 4.034489393234253e-06, 4.2049214243888855e-06, 4.375353455543518e-06, 4.545785486698151e-06, 4.716217517852783e-06, 4.886649549007416e-06, 5.057081580162048e-06, 5.227513611316681e-06, 5.3979456424713135e-06, 5.568377673625946e-06, 5.738809704780579e-06, 5.909241735935211e-06, 6.079673767089844e-06]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 4.0, 5.0, 6.0, 3.0, 9.0, 6.0, 14.0, 13.0, 9.0, 22.0, 20.0, 27.0, 32.0, 32.0, 27.0, 38.0, 40.0, 41.0, 37.0, 48.0, 57.0, 43.0, 35.0, 37.0, 38.0, 36.0, 41.0, 36.0, 31.0, 21.0, 34.0, 27.0, 18.0, 19.0, 13.0, 15.0, 14.0, 10.0, 8.0, 3.0, 8.0, 12.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6591796875, -1.5928192138671875, -1.526458740234375, -1.4600982666015625, -1.39373779296875, -1.3273773193359375, -1.261016845703125, -1.1946563720703125, -1.1282958984375, -1.0619354248046875, -0.995574951171875, -0.9292144775390625, -0.86285400390625, -0.7964935302734375, -0.730133056640625, -0.6637725830078125, -0.597412109375, -0.5310516357421875, -0.464691162109375, -0.3983306884765625, -0.33197021484375, -0.2656097412109375, -0.199249267578125, -0.1328887939453125, -0.0665283203125, -0.0001678466796875, 0.066192626953125, 0.1325531005859375, 0.19891357421875, 0.2652740478515625, 0.331634521484375, 0.3979949951171875, 0.46435546875, 0.5307159423828125, 0.597076416015625, 0.6634368896484375, 0.72979736328125, 0.7961578369140625, 0.862518310546875, 0.9288787841796875, 0.9952392578125, 1.0615997314453125, 1.127960205078125, 1.1943206787109375, 1.26068115234375, 1.3270416259765625, 1.393402099609375, 1.4597625732421875, 1.526123046875, 1.5924835205078125, 1.658843994140625, 1.7252044677734375, 1.79156494140625, 1.8579254150390625, 1.924285888671875, 1.9906463623046875, 2.0570068359375, 2.1233673095703125, 2.189727783203125, 2.2560882568359375, 2.32244873046875, 2.3888092041015625, 2.455169677734375, 2.5215301513671875, 2.587890625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 9.0, 13.0, 21.0, 27.0, 38.0, 43.0, 75.0, 97.0, 157.0, 285.0, 508.0, 991.0, 1960.0, 4551.0, 10996.0, 29911.0, 109943.0, 586480.0, 224978.0, 49359.0, 16161.0, 6360.0, 2688.0, 1336.0, 664.0, 359.0, 214.0, 98.0, 75.0, 46.0, 30.0, 20.0, 20.0, 13.0, 13.0, 6.0, 6.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6640625, -2.55169677734375, -2.4393310546875, -2.32696533203125, -2.214599609375, -2.10223388671875, -1.9898681640625, -1.87750244140625, -1.76513671875, -1.65277099609375, -1.5404052734375, -1.42803955078125, -1.315673828125, -1.20330810546875, -1.0909423828125, -0.97857666015625, -0.8662109375, -0.75384521484375, -0.6414794921875, -0.52911376953125, -0.416748046875, -0.30438232421875, -0.1920166015625, -0.07965087890625, 0.03271484375, 0.14508056640625, 0.2574462890625, 0.36981201171875, 0.482177734375, 0.59454345703125, 0.7069091796875, 0.81927490234375, 0.931640625, 1.04400634765625, 1.1563720703125, 1.26873779296875, 1.381103515625, 1.49346923828125, 1.6058349609375, 1.71820068359375, 1.83056640625, 1.94293212890625, 2.0552978515625, 2.16766357421875, 2.280029296875, 2.39239501953125, 2.5047607421875, 2.61712646484375, 2.7294921875, 2.84185791015625, 2.9542236328125, 3.06658935546875, 3.178955078125, 3.29132080078125, 3.4036865234375, 3.51605224609375, 3.62841796875, 3.74078369140625, 3.8531494140625, 3.96551513671875, 4.077880859375, 4.19024658203125, 4.3026123046875, 4.41497802734375, 4.52734375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 6.0, 4.0, 8.0, 6.0, 7.0, 17.0, 10.0, 18.0, 26.0, 20.0, 36.0, 30.0, 25.0, 37.0, 54.0, 55.0, 58.0, 140.0, 1850.0, 179.0, 62.0, 51.0, 48.0, 36.0, 45.0, 39.0, 35.0, 21.0, 31.0, 19.0, 14.0, 12.0, 16.0, 5.0, 5.0, 10.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.41015625, -7.14178466796875, -6.8734130859375, -6.60504150390625, -6.336669921875, -6.06829833984375, -5.7999267578125, -5.53155517578125, -5.26318359375, -4.99481201171875, -4.7264404296875, -4.45806884765625, -4.189697265625, -3.92132568359375, -3.6529541015625, -3.38458251953125, -3.1162109375, -2.84783935546875, -2.5794677734375, -2.31109619140625, -2.042724609375, -1.77435302734375, -1.5059814453125, -1.23760986328125, -0.96923828125, -0.70086669921875, -0.4324951171875, -0.16412353515625, 0.104248046875, 0.37261962890625, 0.6409912109375, 0.90936279296875, 1.177734375, 1.44610595703125, 1.7144775390625, 1.98284912109375, 2.251220703125, 2.51959228515625, 2.7879638671875, 3.05633544921875, 3.32470703125, 3.59307861328125, 3.8614501953125, 4.12982177734375, 4.398193359375, 4.66656494140625, 4.9349365234375, 5.20330810546875, 5.4716796875, 5.74005126953125, 6.0084228515625, 6.27679443359375, 6.545166015625, 6.81353759765625, 7.0819091796875, 7.35028076171875, 7.61865234375, 7.88702392578125, 8.1553955078125, 8.42376708984375, 8.692138671875, 8.96051025390625, 9.2288818359375, 9.49725341796875, 9.765625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 4.0, 7.0, 12.0, 13.0, 10.0, 17.0, 14.0, 25.0, 28.0, 38.0, 52.0, 77.0, 109.0, 169.0, 340.0, 889.0, 3293.0, 18006.0, 258866.0, 2814492.0, 40433.0, 6194.0, 1460.0, 493.0, 240.0, 112.0, 66.0, 53.0, 39.0, 27.0, 25.0, 23.0, 9.0, 12.0, 8.0, 11.0, 6.0, 6.0, 6.0, 5.0, 8.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.7421875, -11.388427734375, -11.03466796875, -10.680908203125, -10.3271484375, -9.973388671875, -9.61962890625, -9.265869140625, -8.912109375, -8.558349609375, -8.20458984375, -7.850830078125, -7.4970703125, -7.143310546875, -6.78955078125, -6.435791015625, -6.08203125, -5.728271484375, -5.37451171875, -5.020751953125, -4.6669921875, -4.313232421875, -3.95947265625, -3.605712890625, -3.251953125, -2.898193359375, -2.54443359375, -2.190673828125, -1.8369140625, -1.483154296875, -1.12939453125, -0.775634765625, -0.421875, -0.068115234375, 0.28564453125, 0.639404296875, 0.9931640625, 1.346923828125, 1.70068359375, 2.054443359375, 2.408203125, 2.761962890625, 3.11572265625, 3.469482421875, 3.8232421875, 4.177001953125, 4.53076171875, 4.884521484375, 5.23828125, 5.592041015625, 5.94580078125, 6.299560546875, 6.6533203125, 7.007080078125, 7.36083984375, 7.714599609375, 8.068359375, 8.422119140625, 8.77587890625, 9.129638671875, 9.4833984375, 9.837158203125, 10.19091796875, 10.544677734375, 10.8984375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [130.0, 865.0, 23.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.288099765777588, -1.67124605178833, 2.9456076622009277, 7.5624613761901855, 12.179315567016602, 16.79616928100586, 21.413022994995117, 26.029878616333008, 30.646730422973633, 35.26358413696289, 39.88043975830078, 44.497291564941406, 49.11414337158203, 53.73099899291992, 58.34785461425781, 62.96470642089844, 67.58155822753906, 72.19841003417969, 76.81526184082031, 81.43212127685547, 86.0489730834961, 90.66582489013672, 95.28268432617188, 99.8995361328125, 104.51638793945312, 109.13323974609375, 113.75009155273438, 118.36695098876953, 122.98380279541016, 127.60065460205078, 132.21751403808594, 136.83436584472656, 141.45123291015625, 146.06808471679688, 150.6849365234375, 155.30178833007812, 159.91864013671875, 164.53550720214844, 169.15235900878906, 173.7692108154297, 178.3860626220703, 183.00291442871094, 187.61976623535156, 192.2366180419922, 196.85348510742188, 201.4703369140625, 206.08718872070312, 210.70404052734375, 215.32089233398438, 219.937744140625, 224.55459594726562, 229.17144775390625, 233.78829956054688, 238.40516662597656, 243.0220184326172, 247.6388702392578, 252.25572204589844, 256.8725891113281, 261.48944091796875, 266.1062927246094, 270.72314453125, 275.3399963378906, 279.95684814453125, 284.5736999511719, 289.1905517578125]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 4.0, 10.0, 7.0, 9.0, 6.0, 14.0, 17.0, 9.0, 18.0, 18.0, 20.0, 21.0, 32.0, 29.0, 29.0, 28.0, 30.0, 40.0, 28.0, 34.0, 34.0, 35.0, 39.0, 39.0, 41.0, 27.0, 43.0, 36.0, 34.0, 27.0, 34.0, 21.0, 20.0, 21.0, 24.0, 19.0, 15.0, 13.0, 10.0, 10.0, 10.0, 6.0, 5.0, 5.0, 9.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-23.33464813232422, -22.654212951660156, -21.973777770996094, -21.29334259033203, -20.6129093170166, -19.93247413635254, -19.252038955688477, -18.571603775024414, -17.891170501708984, -17.210735321044922, -16.53030014038086, -15.849865913391113, -15.169431686401367, -14.488996505737305, -13.808561325073242, -13.12812614440918, -12.447690963745117, -11.767255783081055, -11.086821556091309, -10.406386375427246, -9.7259521484375, -9.045516967773438, -8.365081787109375, -7.684647083282471, -7.004212379455566, -6.323777675628662, -5.643342971801758, -4.962907791137695, -4.282473087310791, -3.6020383834838867, -2.921603202819824, -2.24116849899292, -1.5607357025146484, -0.8803008794784546, -0.19986605644226074, 0.48056888580322266, 1.161003589630127, 1.8414382934570312, 2.5218734741210938, 3.202308177947998, 3.8827428817749023, 4.563177585601807, 5.243612289428711, 5.924047470092773, 6.604482173919678, 7.284916877746582, 7.9653520584106445, 8.64578628540039, 9.326221466064453, 10.006656646728516, 10.687090873718262, 11.367526054382324, 12.04796028137207, 12.728395462036133, 13.408830642700195, 14.089265823364258, 14.769700050354004, 15.450135231018066, 16.130569458007812, 16.811004638671875, 17.491439819335938, 18.171875, 18.852310180664062, 19.532743453979492, 20.213178634643555]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 3.0, 5.0, 6.0, 9.0, 5.0, 13.0, 13.0, 8.0, 18.0, 24.0, 18.0, 33.0, 27.0, 37.0, 32.0, 42.0, 42.0, 37.0, 50.0, 44.0, 50.0, 31.0, 48.0, 37.0, 34.0, 38.0, 41.0, 33.0, 25.0, 29.0, 21.0, 24.0, 17.0, 17.0, 15.0, 13.0, 12.0, 13.0, 4.0, 9.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6474609375, -1.5796966552734375, -1.511932373046875, -1.4441680908203125, -1.37640380859375, -1.3086395263671875, -1.240875244140625, -1.1731109619140625, -1.1053466796875, -1.0375823974609375, -0.969818115234375, -0.9020538330078125, -0.83428955078125, -0.7665252685546875, -0.698760986328125, -0.6309967041015625, -0.563232421875, -0.4954681396484375, -0.427703857421875, -0.3599395751953125, -0.29217529296875, -0.2244110107421875, -0.156646728515625, -0.0888824462890625, -0.0211181640625, 0.0466461181640625, 0.114410400390625, 0.1821746826171875, 0.24993896484375, 0.3177032470703125, 0.385467529296875, 0.4532318115234375, 0.52099609375, 0.5887603759765625, 0.656524658203125, 0.7242889404296875, 0.79205322265625, 0.8598175048828125, 0.927581787109375, 0.9953460693359375, 1.0631103515625, 1.1308746337890625, 1.198638916015625, 1.2664031982421875, 1.33416748046875, 1.4019317626953125, 1.469696044921875, 1.5374603271484375, 1.605224609375, 1.6729888916015625, 1.740753173828125, 1.8085174560546875, 1.87628173828125, 1.9440460205078125, 2.011810302734375, 2.0795745849609375, 2.1473388671875, 2.2151031494140625, 2.282867431640625, 2.3506317138671875, 2.41839599609375, 2.4861602783203125, 2.553924560546875, 2.6216888427734375, 2.689453125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 8.0, 5.0, 4.0, 4.0, 11.0, 17.0, 20.0, 39.0, 51.0, 62.0, 97.0, 198.0, 426.0, 1002.0, 2735.0, 8427.0, 32518.0, 168523.0, 1802343.0, 1954625.0, 174545.0, 34153.0, 9093.0, 3062.0, 1178.0, 443.0, 252.0, 129.0, 90.0, 58.0, 43.0, 34.0, 13.0, 19.0, 19.0, 12.0, 5.0, 5.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.82421875, -6.58062744140625, -6.3370361328125, -6.09344482421875, -5.849853515625, -5.60626220703125, -5.3626708984375, -5.11907958984375, -4.87548828125, -4.63189697265625, -4.3883056640625, -4.14471435546875, -3.901123046875, -3.65753173828125, -3.4139404296875, -3.17034912109375, -2.9267578125, -2.68316650390625, -2.4395751953125, -2.19598388671875, -1.952392578125, -1.70880126953125, -1.4652099609375, -1.22161865234375, -0.97802734375, -0.73443603515625, -0.4908447265625, -0.24725341796875, -0.003662109375, 0.23992919921875, 0.4835205078125, 0.72711181640625, 0.970703125, 1.21429443359375, 1.4578857421875, 1.70147705078125, 1.945068359375, 2.18865966796875, 2.4322509765625, 2.67584228515625, 2.91943359375, 3.16302490234375, 3.4066162109375, 3.65020751953125, 3.893798828125, 4.13739013671875, 4.3809814453125, 4.62457275390625, 4.8681640625, 5.11175537109375, 5.3553466796875, 5.59893798828125, 5.842529296875, 6.08612060546875, 6.3297119140625, 6.57330322265625, 6.81689453125, 7.06048583984375, 7.3040771484375, 7.54766845703125, 7.791259765625, 8.03485107421875, 8.2784423828125, 8.52203369140625, 8.765625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 10.0, 17.0, 16.0, 30.0, 59.0, 97.0, 180.0, 313.0, 584.0, 871.0, 755.0, 513.0, 286.0, 142.0, 86.0, 53.0, 32.0, 14.0, 9.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.25, -8.892333984375, -8.53466796875, -8.177001953125, -7.8193359375, -7.461669921875, -7.10400390625, -6.746337890625, -6.388671875, -6.031005859375, -5.67333984375, -5.315673828125, -4.9580078125, -4.600341796875, -4.24267578125, -3.885009765625, -3.52734375, -3.169677734375, -2.81201171875, -2.454345703125, -2.0966796875, -1.739013671875, -1.38134765625, -1.023681640625, -0.666015625, -0.308349609375, 0.04931640625, 0.406982421875, 0.7646484375, 1.122314453125, 1.47998046875, 1.837646484375, 2.1953125, 2.552978515625, 2.91064453125, 3.268310546875, 3.6259765625, 3.983642578125, 4.34130859375, 4.698974609375, 5.056640625, 5.414306640625, 5.77197265625, 6.129638671875, 6.4873046875, 6.844970703125, 7.20263671875, 7.560302734375, 7.91796875, 8.275634765625, 8.63330078125, 8.990966796875, 9.3486328125, 9.706298828125, 10.06396484375, 10.421630859375, 10.779296875, 11.136962890625, 11.49462890625, 11.852294921875, 12.2099609375, 12.567626953125, 12.92529296875, 13.282958984375, 13.640625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 2.0, 6.0, 8.0, 19.0, 39.0, 65.0, 110.0, 194.0, 353.0, 859.0, 2236.0, 8665.0, 54396.0, 640785.0, 3167072.0, 281443.0, 29701.0, 5326.0, 1658.0, 679.0, 290.0, 158.0, 90.0, 43.0, 29.0, 14.0, 17.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7578125, -13.2357177734375, -12.713623046875, -12.1915283203125, -11.66943359375, -11.1473388671875, -10.625244140625, -10.1031494140625, -9.5810546875, -9.0589599609375, -8.536865234375, -8.0147705078125, -7.49267578125, -6.9705810546875, -6.448486328125, -5.9263916015625, -5.404296875, -4.8822021484375, -4.360107421875, -3.8380126953125, -3.31591796875, -2.7938232421875, -2.271728515625, -1.7496337890625, -1.2275390625, -0.7054443359375, -0.183349609375, 0.3387451171875, 0.86083984375, 1.3829345703125, 1.905029296875, 2.4271240234375, 2.94921875, 3.4713134765625, 3.993408203125, 4.5155029296875, 5.03759765625, 5.5596923828125, 6.081787109375, 6.6038818359375, 7.1259765625, 7.6480712890625, 8.170166015625, 8.6922607421875, 9.21435546875, 9.7364501953125, 10.258544921875, 10.7806396484375, 11.302734375, 11.8248291015625, 12.346923828125, 12.8690185546875, 13.39111328125, 13.9132080078125, 14.435302734375, 14.9573974609375, 15.4794921875, 16.0015869140625, 16.523681640625, 17.0457763671875, 17.56787109375, 18.0899658203125, 18.612060546875, 19.1341552734375, 19.65625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 6.0, 6.0, 23.0, 38.0, 54.0, 38.0, 60.0, 78.0, 79.0, 109.0, 101.0, 73.0, 82.0, 69.0, 44.0, 35.0, 34.0, 30.0, 11.0, 7.0, 10.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-42.87489318847656, -41.83043670654297, -40.785980224609375, -39.741519927978516, -38.69706344604492, -37.65260696411133, -36.608150482177734, -35.56369400024414, -34.51923370361328, -33.47477722167969, -32.430320739746094, -31.385862350463867, -30.34140396118164, -29.296947479248047, -28.252490997314453, -27.20803451538086, -26.163578033447266, -25.119121551513672, -24.074663162231445, -23.03020668029785, -21.985748291015625, -20.94129180908203, -19.896835327148438, -18.852378845214844, -17.807920455932617, -16.763463973999023, -15.719005584716797, -14.674549102783203, -13.630091667175293, -12.585634231567383, -11.541177749633789, -10.496720314025879, -9.452266693115234, -8.407809257507324, -7.363352298736572, -6.31889533996582, -5.27443790435791, -4.22998046875, -3.185523509979248, -2.141066551208496, -1.096609115600586, -0.05215191841125488, 0.9923052787780762, 2.0367624759674072, 3.0812196731567383, 4.125677108764648, 5.1701340675354, 6.214591026306152, 7.2590484619140625, 8.303505897521973, 9.347963333129883, 10.392419815063477, 11.436877250671387, 12.481334686279297, 13.52579116821289, 14.5702486038208, 15.614706039428711, 16.659162521362305, 17.70362091064453, 18.748077392578125, 19.79253387451172, 20.836992263793945, 21.88144874572754, 22.925907135009766, 23.97036361694336]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 10.0, 10.0, 14.0, 10.0, 14.0, 21.0, 22.0, 26.0, 30.0, 26.0, 29.0, 37.0, 43.0, 36.0, 39.0, 31.0, 41.0, 46.0, 38.0, 43.0, 37.0, 45.0, 55.0, 40.0, 36.0, 42.0, 31.0, 28.0, 18.0, 11.0, 13.0, 14.0, 10.0, 12.0, 9.0, 10.0, 6.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.03240966796875, -24.27315902709961, -23.51390838623047, -22.754655838012695, -21.995405197143555, -21.236154556274414, -20.47690200805664, -19.7176513671875, -18.95840072631836, -18.19915008544922, -17.439899444580078, -16.680646896362305, -15.921396255493164, -15.162145614624023, -14.402894020080566, -13.64364242553711, -12.884391784667969, -12.125141143798828, -11.365889549255371, -10.606637954711914, -9.847387313842773, -9.088136672973633, -8.328885078430176, -7.569633960723877, -6.810382843017578, -6.051131725311279, -5.2918806076049805, -4.532629489898682, -3.773378372192383, -3.014127254486084, -2.254876136779785, -1.4956250190734863, -0.7363739013671875, 0.022877216339111328, 0.7821283340454102, 1.541379451751709, 2.300630569458008, 3.0598816871643066, 3.8191328048706055, 4.578383922576904, 5.337635040283203, 6.096886157989502, 6.856137275695801, 7.6153883934021, 8.374639511108398, 9.133890151977539, 9.893141746520996, 10.652393341064453, 11.411643981933594, 12.170894622802734, 12.930146217346191, 13.689397811889648, 14.448648452758789, 15.20789909362793, 15.967150688171387, 16.726402282714844, 17.485652923583984, 18.244903564453125, 19.004154205322266, 19.76340675354004, 20.52265739440918, 21.28190803527832, 22.041160583496094, 22.800411224365234, 23.559661865234375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 2.0, 8.0, 5.0, 11.0, 19.0, 16.0, 18.0, 22.0, 23.0, 25.0, 21.0, 33.0, 24.0, 52.0, 37.0, 38.0, 52.0, 38.0, 53.0, 48.0, 37.0, 30.0, 37.0, 35.0, 53.0, 30.0, 32.0, 22.0, 24.0, 24.0, 20.0, 14.0, 19.0, 10.0, 13.0, 13.0, 7.0, 7.0, 6.0, 6.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8798828125, -1.8086700439453125, -1.737457275390625, -1.6662445068359375, -1.59503173828125, -1.5238189697265625, -1.452606201171875, -1.3813934326171875, -1.3101806640625, -1.2389678955078125, -1.167755126953125, -1.0965423583984375, -1.02532958984375, -0.9541168212890625, -0.882904052734375, -0.8116912841796875, -0.740478515625, -0.6692657470703125, -0.598052978515625, -0.5268402099609375, -0.45562744140625, -0.3844146728515625, -0.313201904296875, -0.2419891357421875, -0.1707763671875, -0.0995635986328125, -0.028350830078125, 0.0428619384765625, 0.11407470703125, 0.1852874755859375, 0.256500244140625, 0.3277130126953125, 0.39892578125, 0.4701385498046875, 0.541351318359375, 0.6125640869140625, 0.68377685546875, 0.7549896240234375, 0.826202392578125, 0.8974151611328125, 0.9686279296875, 1.0398406982421875, 1.111053466796875, 1.1822662353515625, 1.25347900390625, 1.3246917724609375, 1.395904541015625, 1.4671173095703125, 1.538330078125, 1.6095428466796875, 1.680755615234375, 1.7519683837890625, 1.82318115234375, 1.8943939208984375, 1.965606689453125, 2.0368194580078125, 2.1080322265625, 2.1792449951171875, 2.250457763671875, 2.3216705322265625, 2.39288330078125, 2.4640960693359375, 2.535308837890625, 2.6065216064453125, 2.677734375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 8.0, 5.0, 6.0, 13.0, 24.0, 25.0, 44.0, 56.0, 95.0, 151.0, 217.0, 325.0, 513.0, 780.0, 1194.0, 1880.0, 2944.0, 4530.0, 6999.0, 11022.0, 17226.0, 27173.0, 45270.0, 79057.0, 156038.0, 360925.0, 143313.0, 74693.0, 42488.0, 25745.0, 16261.0, 10590.0, 6820.0, 4321.0, 2717.0, 1839.0, 1161.0, 722.0, 497.0, 298.0, 195.0, 132.0, 89.0, 52.0, 34.0, 28.0, 25.0, 8.0, 6.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1942138671875, -0.18803787231445312, -0.18186187744140625, -0.17568588256835938, -0.1695098876953125, -0.16333389282226562, -0.15715789794921875, -0.15098190307617188, -0.144805908203125, -0.13862991333007812, -0.13245391845703125, -0.12627792358398438, -0.1201019287109375, -0.11392593383789062, -0.10774993896484375, -0.10157394409179688, -0.09539794921875, -0.08922195434570312, -0.08304595947265625, -0.07686996459960938, -0.0706939697265625, -0.06451797485351562, -0.05834197998046875, -0.052165985107421875, -0.045989990234375, -0.039813995361328125, -0.03363800048828125, -0.027462005615234375, -0.0212860107421875, -0.015110015869140625, -0.00893402099609375, -0.002758026123046875, 0.00341796875, 0.009593963623046875, 0.01576995849609375, 0.021945953369140625, 0.0281219482421875, 0.034297943115234375, 0.04047393798828125, 0.046649932861328125, 0.052825927734375, 0.059001922607421875, 0.06517791748046875, 0.07135391235351562, 0.0775299072265625, 0.08370590209960938, 0.08988189697265625, 0.09605789184570312, 0.10223388671875, 0.10840988159179688, 0.11458587646484375, 0.12076187133789062, 0.1269378662109375, 0.13311386108398438, 0.13928985595703125, 0.14546585083007812, 0.151641845703125, 0.15781784057617188, 0.16399383544921875, 0.17016983032226562, 0.1763458251953125, 0.18252182006835938, 0.18869781494140625, 0.19487380981445312, 0.2010498046875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 10.0, 5.0, 9.0, 14.0, 14.0, 15.0, 18.0, 20.0, 19.0, 30.0, 25.0, 31.0, 27.0, 25.0, 37.0, 36.0, 44.0, 37.0, 31.0, 1070.0, 39.0, 40.0, 42.0, 40.0, 31.0, 46.0, 32.0, 33.0, 28.0, 28.0, 19.0, 15.0, 18.0, 19.0, 9.0, 18.0, 6.0, 6.0, 8.0, 5.0, 4.0, 2.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.6396484375, -1.592010498046875, -1.54437255859375, -1.496734619140625, -1.4490966796875, -1.401458740234375, -1.35382080078125, -1.306182861328125, -1.258544921875, -1.210906982421875, -1.16326904296875, -1.115631103515625, -1.0679931640625, -1.020355224609375, -0.97271728515625, -0.925079345703125, -0.87744140625, -0.829803466796875, -0.78216552734375, -0.734527587890625, -0.6868896484375, -0.639251708984375, -0.59161376953125, -0.543975830078125, -0.496337890625, -0.448699951171875, -0.40106201171875, -0.353424072265625, -0.3057861328125, -0.258148193359375, -0.21051025390625, -0.162872314453125, -0.115234375, -0.067596435546875, -0.01995849609375, 0.027679443359375, 0.0753173828125, 0.122955322265625, 0.17059326171875, 0.218231201171875, 0.265869140625, 0.313507080078125, 0.36114501953125, 0.408782958984375, 0.4564208984375, 0.504058837890625, 0.55169677734375, 0.599334716796875, 0.64697265625, 0.694610595703125, 0.74224853515625, 0.789886474609375, 0.8375244140625, 0.885162353515625, 0.93280029296875, 0.980438232421875, 1.028076171875, 1.075714111328125, 1.12335205078125, 1.170989990234375, 1.2186279296875, 1.266265869140625, 1.31390380859375, 1.361541748046875, 1.4091796875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 5.0, 4.0, 7.0, 10.0, 21.0, 29.0, 33.0, 42.0, 79.0, 112.0, 189.0, 207.0, 327.0, 521.0, 717.0, 1043.0, 1666.0, 2353.0, 3655.0, 5569.0, 8585.0, 13819.0, 22474.0, 37862.0, 67531.0, 135675.0, 1414040.0, 181199.0, 82923.0, 45175.0, 26314.0, 16023.0, 10032.0, 6345.0, 4183.0, 2732.0, 1803.0, 1201.0, 828.0, 576.0, 403.0, 248.0, 187.0, 115.0, 86.0, 60.0, 39.0, 32.0, 19.0, 18.0, 9.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09442138671875, -0.09123802185058594, -0.08805465698242188, -0.08487129211425781, -0.08168792724609375, -0.07850456237792969, -0.07532119750976562, -0.07213783264160156, -0.0689544677734375, -0.06577110290527344, -0.06258773803710938, -0.05940437316894531, -0.05622100830078125, -0.05303764343261719, -0.049854278564453125, -0.04667091369628906, -0.043487548828125, -0.04030418395996094, -0.037120819091796875, -0.03393745422363281, -0.03075408935546875, -0.027570724487304688, -0.024387359619140625, -0.021203994750976562, -0.0180206298828125, -0.014837265014648438, -0.011653900146484375, -0.008470535278320312, -0.00528717041015625, -0.0021038055419921875, 0.001079559326171875, 0.0042629241943359375, 0.0074462890625, 0.010629653930664062, 0.013813018798828125, 0.016996383666992188, 0.02017974853515625, 0.023363113403320312, 0.026546478271484375, 0.029729843139648438, 0.0329132080078125, 0.03609657287597656, 0.039279937744140625, 0.04246330261230469, 0.04564666748046875, 0.04883003234863281, 0.052013397216796875, 0.05519676208496094, 0.058380126953125, 0.06156349182128906, 0.06474685668945312, 0.06793022155761719, 0.07111358642578125, 0.07429695129394531, 0.07748031616210938, 0.08066368103027344, 0.0838470458984375, 0.08703041076660156, 0.09021377563476562, 0.09339714050292969, 0.09658050537109375, 0.09976387023925781, 0.10294723510742188, 0.10613059997558594, 0.10931396484375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 11.0, 5.0, 14.0, 13.0, 14.0, 27.0, 19.0, 19.0, 31.0, 32.0, 43.0, 55.0, 61.0, 112.0, 122.0, 97.0, 58.0, 32.0, 42.0, 30.0, 26.0, 27.0, 20.0, 14.0, 18.0, 10.0, 8.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0073184967041016e-05, -9.718351066112518e-06, -9.363517165184021e-06, -9.008683264255524e-06, -8.653849363327026e-06, -8.299015462398529e-06, -7.944181561470032e-06, -7.5893476605415344e-06, -7.234513759613037e-06, -6.87967985868454e-06, -6.5248459577560425e-06, -6.170012056827545e-06, -5.815178155899048e-06, -5.4603442549705505e-06, -5.105510354042053e-06, -4.750676453113556e-06, -4.395842552185059e-06, -4.041008651256561e-06, -3.686174750328064e-06, -3.3313408493995667e-06, -2.9765069484710693e-06, -2.621673047542572e-06, -2.2668391466140747e-06, -1.9120052456855774e-06, -1.55717134475708e-06, -1.2023374438285828e-06, -8.475035429000854e-07, -4.926696419715881e-07, -1.3783574104309082e-07, 2.169981598854065e-07, 5.718320608139038e-07, 9.266659617424011e-07, 1.2814998626708984e-06, 1.6363337635993958e-06, 1.991167664527893e-06, 2.3460015654563904e-06, 2.7008354663848877e-06, 3.055669367313385e-06, 3.4105032682418823e-06, 3.7653371691703796e-06, 4.120171070098877e-06, 4.475004971027374e-06, 4.829838871955872e-06, 5.184672772884369e-06, 5.539506673812866e-06, 5.8943405747413635e-06, 6.249174475669861e-06, 6.604008376598358e-06, 6.9588422775268555e-06, 7.313676178455353e-06, 7.66851007938385e-06, 8.023343980312347e-06, 8.378177881240845e-06, 8.733011782169342e-06, 9.08784568309784e-06, 9.442679584026337e-06, 9.797513484954834e-06, 1.0152347385883331e-05, 1.0507181286811829e-05, 1.0862015187740326e-05, 1.1216849088668823e-05, 1.157168298959732e-05, 1.1926516890525818e-05, 1.2281350791454315e-05, 1.2636184692382812e-05]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 10.0, 26.0, 38.0, 41.0, 65.0, 93.0, 200.0, 508.0, 1789.0, 8901.0, 67504.0, 799523.0, 149520.0, 16174.0, 2801.0, 698.0, 277.0, 133.0, 69.0, 38.0, 37.0, 16.0, 16.0, 16.0, 10.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021445751190185547, -0.00020826980471611023, -0.000202082097530365, -0.00019589439034461975, -0.0001897066831588745, -0.00018351897597312927, -0.00017733126878738403, -0.0001711435616016388, -0.00016495585441589355, -0.00015876814723014832, -0.00015258044004440308, -0.00014639273285865784, -0.0001402050256729126, -0.00013401731848716736, -0.00012782961130142212, -0.00012164190411567688, -0.00011545419692993164, -0.0001092664897441864, -0.00010307878255844116, -9.689107537269592e-05, -9.070336818695068e-05, -8.451566100120544e-05, -7.83279538154602e-05, -7.214024662971497e-05, -6.595253944396973e-05, -5.976483225822449e-05, -5.357712507247925e-05, -4.738941788673401e-05, -4.120171070098877e-05, -3.501400351524353e-05, -2.882629632949829e-05, -2.2638589143753052e-05, -1.6450881958007812e-05, -1.0263174772262573e-05, -4.075467586517334e-06, 2.1122395992279053e-06, 8.299946784973145e-06, 1.4487653970718384e-05, 2.0675361156463623e-05, 2.6863068342208862e-05, 3.30507755279541e-05, 3.923848271369934e-05, 4.542618989944458e-05, 5.161389708518982e-05, 5.780160427093506e-05, 6.39893114566803e-05, 7.017701864242554e-05, 7.636472582817078e-05, 8.255243301391602e-05, 8.874014019966125e-05, 9.49278473854065e-05, 0.00010111555457115173, 0.00010730326175689697, 0.00011349096894264221, 0.00011967867612838745, 0.0001258663833141327, 0.00013205409049987793, 0.00013824179768562317, 0.0001444295048713684, 0.00015061721205711365, 0.0001568049192428589, 0.00016299262642860413, 0.00016918033361434937, 0.0001753680408000946, 0.00018155574798583984]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 10.0, 13.0, 19.0, 20.0, 26.0, 38.0, 59.0, 90.0, 101.0, 102.0, 108.0, 82.0, 75.0, 61.0, 47.0, 35.0, 30.0, 9.0, 17.0, 10.0, 4.0, 6.0, 13.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1065905709983781e-05, -1.0669057701306883e-05, -1.0272209692629986e-05, -9.875361683953088e-06, -9.47851367527619e-06, -9.081665666599292e-06, -8.684817657922395e-06, -8.287969649245497e-06, -7.891121640568599e-06, -7.494273631891701e-06, -7.097425623214804e-06, -6.700577614537906e-06, -6.303729605861008e-06, -5.9068815971841104e-06, -5.510033588507213e-06, -5.113185579830315e-06, -4.716337571153417e-06, -4.3194895624765195e-06, -3.922641553799622e-06, -3.525793545122724e-06, -3.1289455364458263e-06, -2.7320975277689286e-06, -2.335249519092031e-06, -1.938401510415133e-06, -1.5415535017382354e-06, -1.1447054930613376e-06, -7.478574843844399e-07, -3.5100947570754215e-07, 4.583853296935558e-08, 4.426865416462533e-07, 8.39534550323151e-07, 1.2363825590000488e-06, 1.6332305676769465e-06, 2.0300785763538443e-06, 2.426926585030742e-06, 2.8237745937076397e-06, 3.2206226023845375e-06, 3.617470611061435e-06, 4.014318619738333e-06, 4.411166628415231e-06, 4.808014637092128e-06, 5.204862645769026e-06, 5.601710654445924e-06, 5.998558663122822e-06, 6.395406671799719e-06, 6.792254680476617e-06, 7.189102689153515e-06, 7.5859506978304125e-06, 7.98279870650731e-06, 8.379646715184208e-06, 8.776494723861106e-06, 9.173342732538003e-06, 9.570190741214901e-06, 9.967038749891799e-06, 1.0363886758568697e-05, 1.0760734767245594e-05, 1.1157582775922492e-05, 1.155443078459939e-05, 1.1951278793276288e-05, 1.2348126801953185e-05, 1.2744974810630083e-05, 1.314182281930698e-05, 1.3538670827983879e-05, 1.3935518836660776e-05, 1.4332366845337674e-05]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 5.0, 5.0, 5.0, 17.0, 19.0, 28.0, 32.0, 35.0, 22.0, 42.0, 39.0, 32.0, 54.0, 38.0, 36.0, 36.0, 33.0, 42.0, 55.0, 43.0, 36.0, 37.0, 48.0, 29.0, 37.0, 30.0, 27.0, 18.0, 23.0, 15.0, 18.0, 13.0, 10.0, 15.0, 6.0, 0.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.066394805908203e-06, -4.886649549007416e-06, -4.706904292106628e-06, -4.527159035205841e-06, -4.347413778305054e-06, -4.167668521404266e-06, -3.987923264503479e-06, -3.8081780076026917e-06, -3.6284327507019043e-06, -3.448687493801117e-06, -3.2689422369003296e-06, -3.0891969799995422e-06, -2.909451723098755e-06, -2.7297064661979675e-06, -2.54996120929718e-06, -2.370215952396393e-06, -2.1904706954956055e-06, -2.010725438594818e-06, -1.8309801816940308e-06, -1.6512349247932434e-06, -1.471489667892456e-06, -1.2917444109916687e-06, -1.1119991540908813e-06, -9.32253897190094e-07, -7.525086402893066e-07, -5.727633833885193e-07, -3.9301812648773193e-07, -2.1327286958694458e-07, -3.3527612686157227e-08, 1.4621764421463013e-07, 3.259629011154175e-07, 5.057081580162048e-07, 6.854534149169922e-07, 8.651986718177795e-07, 1.044943928718567e-06, 1.2246891856193542e-06, 1.4044344425201416e-06, 1.584179699420929e-06, 1.7639249563217163e-06, 1.9436702132225037e-06, 2.123415470123291e-06, 2.3031607270240784e-06, 2.4829059839248657e-06, 2.662651240825653e-06, 2.8423964977264404e-06, 3.0221417546272278e-06, 3.201887011528015e-06, 3.3816322684288025e-06, 3.56137752532959e-06, 3.741122782230377e-06, 3.9208680391311646e-06, 4.100613296031952e-06, 4.280358552932739e-06, 4.460103809833527e-06, 4.639849066734314e-06, 4.819594323635101e-06, 4.999339580535889e-06, 5.179084837436676e-06, 5.358830094337463e-06, 5.538575351238251e-06, 5.718320608139038e-06, 5.8980658650398254e-06, 6.077811121940613e-06, 6.2575563788414e-06, 6.4373016357421875e-06]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 2.0, 8.0, 5.0, 11.0, 19.0, 16.0, 18.0, 22.0, 23.0, 25.0, 21.0, 33.0, 24.0, 52.0, 37.0, 38.0, 52.0, 38.0, 53.0, 48.0, 37.0, 30.0, 37.0, 35.0, 53.0, 30.0, 32.0, 22.0, 24.0, 24.0, 20.0, 14.0, 19.0, 10.0, 13.0, 13.0, 7.0, 7.0, 6.0, 6.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8798828125, -1.8086700439453125, -1.737457275390625, -1.6662445068359375, -1.59503173828125, -1.5238189697265625, -1.452606201171875, -1.3813934326171875, -1.3101806640625, -1.2389678955078125, -1.167755126953125, -1.0965423583984375, -1.02532958984375, -0.9541168212890625, -0.882904052734375, -0.8116912841796875, -0.740478515625, -0.6692657470703125, -0.598052978515625, -0.5268402099609375, -0.45562744140625, -0.3844146728515625, -0.313201904296875, -0.2419891357421875, -0.1707763671875, -0.0995635986328125, -0.028350830078125, 0.0428619384765625, 0.11407470703125, 0.1852874755859375, 0.256500244140625, 0.3277130126953125, 0.39892578125, 0.4701385498046875, 0.541351318359375, 0.6125640869140625, 0.68377685546875, 0.7549896240234375, 0.826202392578125, 0.8974151611328125, 0.9686279296875, 1.0398406982421875, 1.111053466796875, 1.1822662353515625, 1.25347900390625, 1.3246917724609375, 1.395904541015625, 1.4671173095703125, 1.538330078125, 1.6095428466796875, 1.680755615234375, 1.7519683837890625, 1.82318115234375, 1.8943939208984375, 1.965606689453125, 2.0368194580078125, 2.1080322265625, 2.1792449951171875, 2.250457763671875, 2.3216705322265625, 2.39288330078125, 2.4640960693359375, 2.535308837890625, 2.6065216064453125, 2.677734375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 11.0, 18.0, 21.0, 34.0, 54.0, 74.0, 129.0, 200.0, 330.0, 479.0, 775.0, 1407.0, 2464.0, 4573.0, 8650.0, 16946.0, 36040.0, 87251.0, 257796.0, 399171.0, 134262.0, 50520.0, 22645.0, 11225.0, 5837.0, 3144.0, 1751.0, 984.0, 669.0, 372.0, 213.0, 158.0, 95.0, 80.0, 52.0, 41.0, 27.0, 12.0, 11.0, 4.0, 4.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.829376220703125, -2.72906494140625, -2.628753662109375, -2.5284423828125, -2.428131103515625, -2.32781982421875, -2.227508544921875, -2.127197265625, -2.026885986328125, -1.92657470703125, -1.826263427734375, -1.7259521484375, -1.625640869140625, -1.52532958984375, -1.425018310546875, -1.32470703125, -1.224395751953125, -1.12408447265625, -1.023773193359375, -0.9234619140625, -0.823150634765625, -0.72283935546875, -0.622528076171875, -0.522216796875, -0.421905517578125, -0.32159423828125, -0.221282958984375, -0.1209716796875, -0.020660400390625, 0.07965087890625, 0.179962158203125, 0.2802734375, 0.380584716796875, 0.48089599609375, 0.581207275390625, 0.6815185546875, 0.781829833984375, 0.88214111328125, 0.982452392578125, 1.082763671875, 1.183074951171875, 1.28338623046875, 1.383697509765625, 1.4840087890625, 1.584320068359375, 1.68463134765625, 1.784942626953125, 1.88525390625, 1.985565185546875, 2.08587646484375, 2.186187744140625, 2.2864990234375, 2.386810302734375, 2.48712158203125, 2.587432861328125, 2.687744140625, 2.788055419921875, 2.88836669921875, 2.988677978515625, 3.0889892578125, 3.189300537109375, 3.28961181640625, 3.389923095703125, 3.490234375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 11.0, 4.0, 9.0, 13.0, 8.0, 15.0, 25.0, 15.0, 29.0, 30.0, 36.0, 51.0, 43.0, 31.0, 53.0, 59.0, 95.0, 186.0, 1612.0, 187.0, 87.0, 71.0, 47.0, 48.0, 49.0, 31.0, 33.0, 18.0, 22.0, 17.0, 24.0, 10.0, 14.0, 18.0, 11.0, 10.0, 10.0, 7.0, 1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.765625, -8.50384521484375, -8.2420654296875, -7.98028564453125, -7.718505859375, -7.45672607421875, -7.1949462890625, -6.93316650390625, -6.67138671875, -6.40960693359375, -6.1478271484375, -5.88604736328125, -5.624267578125, -5.36248779296875, -5.1007080078125, -4.83892822265625, -4.5771484375, -4.31536865234375, -4.0535888671875, -3.79180908203125, -3.530029296875, -3.26824951171875, -3.0064697265625, -2.74468994140625, -2.48291015625, -2.22113037109375, -1.9593505859375, -1.69757080078125, -1.435791015625, -1.17401123046875, -0.9122314453125, -0.65045166015625, -0.388671875, -0.12689208984375, 0.1348876953125, 0.39666748046875, 0.658447265625, 0.92022705078125, 1.1820068359375, 1.44378662109375, 1.70556640625, 1.96734619140625, 2.2291259765625, 2.49090576171875, 2.752685546875, 3.01446533203125, 3.2762451171875, 3.53802490234375, 3.7998046875, 4.06158447265625, 4.3233642578125, 4.58514404296875, 4.846923828125, 5.10870361328125, 5.3704833984375, 5.63226318359375, 5.89404296875, 6.15582275390625, 6.4176025390625, 6.67938232421875, 6.941162109375, 7.20294189453125, 7.4647216796875, 7.72650146484375, 7.98828125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 12.0, 8.0, 14.0, 18.0, 16.0, 18.0, 24.0, 33.0, 50.0, 50.0, 113.0, 150.0, 297.0, 640.0, 1847.0, 8404.0, 60584.0, 2413421.0, 619096.0, 32952.0, 5363.0, 1398.0, 478.0, 237.0, 151.0, 95.0, 56.0, 43.0, 41.0, 21.0, 21.0, 8.0, 11.0, 10.0, 8.0, 7.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8515625, -12.4482421875, -12.044921875, -11.6416015625, -11.23828125, -10.8349609375, -10.431640625, -10.0283203125, -9.625, -9.2216796875, -8.818359375, -8.4150390625, -8.01171875, -7.6083984375, -7.205078125, -6.8017578125, -6.3984375, -5.9951171875, -5.591796875, -5.1884765625, -4.78515625, -4.3818359375, -3.978515625, -3.5751953125, -3.171875, -2.7685546875, -2.365234375, -1.9619140625, -1.55859375, -1.1552734375, -0.751953125, -0.3486328125, 0.0546875, 0.4580078125, 0.861328125, 1.2646484375, 1.66796875, 2.0712890625, 2.474609375, 2.8779296875, 3.28125, 3.6845703125, 4.087890625, 4.4912109375, 4.89453125, 5.2978515625, 5.701171875, 6.1044921875, 6.5078125, 6.9111328125, 7.314453125, 7.7177734375, 8.12109375, 8.5244140625, 8.927734375, 9.3310546875, 9.734375, 10.1376953125, 10.541015625, 10.9443359375, 11.34765625, 11.7509765625, 12.154296875, 12.5576171875, 12.9609375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 77.0, 251.0, 452.0, 207.0, 25.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.196483612060547, -8.64041519165039, -6.084347724914551, -3.5282797813415527, -0.9722118377685547, 1.5838565826416016, 4.139924049377441, 6.695991516113281, 9.252059936523438, 11.808128356933594, 14.364195823669434, 16.920263290405273, 19.47633171081543, 22.032400131225586, 24.58846664428711, 27.144535064697266, 29.700603485107422, 32.25667190551758, 34.812740325927734, 37.36880874633789, 39.92487335205078, 42.48094177246094, 45.037010192871094, 47.59307861328125, 50.149147033691406, 52.70521545410156, 55.26128387451172, 57.817352294921875, 60.37342071533203, 62.92948913574219, 65.48555755615234, 68.0416259765625, 70.59768676757812, 73.15375518798828, 75.70982360839844, 78.2658920288086, 80.82196044921875, 83.3780288696289, 85.93409729003906, 88.49015808105469, 91.04623413085938, 93.60230255126953, 96.15837097167969, 98.71443939208984, 101.2705078125, 103.82657623291016, 106.38264465332031, 108.93870544433594, 111.4947738647461, 114.05084228515625, 116.6069107055664, 119.16297912597656, 121.71904754638672, 124.27511596679688, 126.83118438720703, 129.3872528076172, 131.9433135986328, 134.49937438964844, 137.05545043945312, 139.61151123046875, 142.16758728027344, 144.72364807128906, 147.27972412109375, 149.83578491210938, 152.39186096191406]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 7.0, 7.0, 10.0, 10.0, 10.0, 24.0, 20.0, 20.0, 33.0, 25.0, 29.0, 20.0, 28.0, 22.0, 36.0, 36.0, 24.0, 37.0, 32.0, 42.0, 39.0, 44.0, 40.0, 35.0, 26.0, 37.0, 39.0, 29.0, 31.0, 29.0, 17.0, 24.0, 19.0, 12.0, 15.0, 17.0, 11.0, 6.0, 11.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-26.194759368896484, -25.4191837310791, -24.64360809326172, -23.86803436279297, -23.092458724975586, -22.316883087158203, -21.54130744934082, -20.765731811523438, -19.990158081054688, -19.214582443237305, -18.439006805419922, -17.663433074951172, -16.88785743713379, -16.112281799316406, -15.336706161499023, -14.56113052368164, -13.785554885864258, -13.009979248046875, -12.234404563903809, -11.458828926086426, -10.68325424194336, -9.907678604125977, -9.132102966308594, -8.356527328491211, -7.5809526443481445, -6.80537748336792, -6.029802322387695, -5.2542266845703125, -4.478651523590088, -3.7030763626098633, -2.9275007247924805, -2.151925563812256, -1.3763504028320312, -0.6007751226425171, 0.17480015754699707, 0.9503755569458008, 1.7259507179260254, 2.50152587890625, 3.277101516723633, 4.052676677703857, 4.828251838684082, 5.603826999664307, 6.379402160644531, 7.154977798461914, 7.930552959442139, 8.706128120422363, 9.481703758239746, 10.257278442382812, 11.032854080200195, 11.808429718017578, 12.584004402160645, 13.359580039978027, 14.135154724121094, 14.910730361938477, 15.68630599975586, 16.461881637573242, 17.237457275390625, 18.013032913208008, 18.78860855102539, 19.56418228149414, 20.339757919311523, 21.115333557128906, 21.89090919494629, 22.666484832763672, 23.442058563232422]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 3.0, 5.0, 11.0, 8.0, 16.0, 19.0, 13.0, 25.0, 29.0, 21.0, 24.0, 29.0, 26.0, 47.0, 29.0, 45.0, 35.0, 53.0, 39.0, 56.0, 31.0, 37.0, 32.0, 35.0, 38.0, 39.0, 34.0, 27.0, 23.0, 24.0, 15.0, 25.0, 15.0, 16.0, 15.0, 14.0, 6.0, 7.0, 4.0, 5.0, 8.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.048828125, -1.97735595703125, -1.9058837890625, -1.83441162109375, -1.762939453125, -1.69146728515625, -1.6199951171875, -1.54852294921875, -1.47705078125, -1.40557861328125, -1.3341064453125, -1.26263427734375, -1.191162109375, -1.11968994140625, -1.0482177734375, -0.97674560546875, -0.9052734375, -0.83380126953125, -0.7623291015625, -0.69085693359375, -0.619384765625, -0.54791259765625, -0.4764404296875, -0.40496826171875, -0.33349609375, -0.26202392578125, -0.1905517578125, -0.11907958984375, -0.047607421875, 0.02386474609375, 0.0953369140625, 0.16680908203125, 0.23828125, 0.30975341796875, 0.3812255859375, 0.45269775390625, 0.524169921875, 0.59564208984375, 0.6671142578125, 0.73858642578125, 0.81005859375, 0.88153076171875, 0.9530029296875, 1.02447509765625, 1.095947265625, 1.16741943359375, 1.2388916015625, 1.31036376953125, 1.3818359375, 1.45330810546875, 1.5247802734375, 1.59625244140625, 1.667724609375, 1.73919677734375, 1.8106689453125, 1.88214111328125, 1.95361328125, 2.02508544921875, 2.0965576171875, 2.16802978515625, 2.239501953125, 2.31097412109375, 2.3824462890625, 2.45391845703125, 2.525390625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 9.0, 4.0, 13.0, 5.0, 13.0, 18.0, 28.0, 35.0, 49.0, 80.0, 128.0, 239.0, 546.0, 1209.0, 3478.0, 12003.0, 52621.0, 327260.0, 2784266.0, 877603.0, 103810.0, 21545.0, 5725.0, 1942.0, 773.0, 354.0, 192.0, 86.0, 77.0, 43.0, 33.0, 17.0, 18.0, 13.0, 9.0, 11.0, 10.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.7578125, -6.5047607421875, -6.251708984375, -5.9986572265625, -5.74560546875, -5.4925537109375, -5.239501953125, -4.9864501953125, -4.7333984375, -4.4803466796875, -4.227294921875, -3.9742431640625, -3.72119140625, -3.4681396484375, -3.215087890625, -2.9620361328125, -2.708984375, -2.4559326171875, -2.202880859375, -1.9498291015625, -1.69677734375, -1.4437255859375, -1.190673828125, -0.9376220703125, -0.6845703125, -0.4315185546875, -0.178466796875, 0.0745849609375, 0.32763671875, 0.5806884765625, 0.833740234375, 1.0867919921875, 1.33984375, 1.5928955078125, 1.845947265625, 2.0989990234375, 2.35205078125, 2.6051025390625, 2.858154296875, 3.1112060546875, 3.3642578125, 3.6173095703125, 3.870361328125, 4.1234130859375, 4.37646484375, 4.6295166015625, 4.882568359375, 5.1356201171875, 5.388671875, 5.6417236328125, 5.894775390625, 6.1478271484375, 6.40087890625, 6.6539306640625, 6.906982421875, 7.1600341796875, 7.4130859375, 7.6661376953125, 7.919189453125, 8.1722412109375, 8.42529296875, 8.6783447265625, 8.931396484375, 9.1844482421875, 9.4375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 12.0, 19.0, 24.0, 32.0, 51.0, 89.0, 141.0, 174.0, 304.0, 471.0, 650.0, 697.0, 468.0, 329.0, 233.0, 125.0, 95.0, 55.0, 24.0, 30.0, 12.0, 12.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3828125, -7.087890625, -6.79296875, -6.498046875, -6.203125, -5.908203125, -5.61328125, -5.318359375, -5.0234375, -4.728515625, -4.43359375, -4.138671875, -3.84375, -3.548828125, -3.25390625, -2.958984375, -2.6640625, -2.369140625, -2.07421875, -1.779296875, -1.484375, -1.189453125, -0.89453125, -0.599609375, -0.3046875, -0.009765625, 0.28515625, 0.580078125, 0.875, 1.169921875, 1.46484375, 1.759765625, 2.0546875, 2.349609375, 2.64453125, 2.939453125, 3.234375, 3.529296875, 3.82421875, 4.119140625, 4.4140625, 4.708984375, 5.00390625, 5.298828125, 5.59375, 5.888671875, 6.18359375, 6.478515625, 6.7734375, 7.068359375, 7.36328125, 7.658203125, 7.953125, 8.248046875, 8.54296875, 8.837890625, 9.1328125, 9.427734375, 9.72265625, 10.017578125, 10.3125, 10.607421875, 10.90234375, 11.197265625, 11.4921875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 8.0, 4.0, 4.0, 8.0, 16.0, 20.0, 29.0, 57.0, 87.0, 126.0, 233.0, 448.0, 955.0, 2477.0, 8274.0, 37861.0, 280691.0, 2793360.0, 949741.0, 96096.0, 16612.0, 4278.0, 1447.0, 680.0, 313.0, 181.0, 109.0, 72.0, 36.0, 23.0, 15.0, 12.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.203125, -15.73681640625, -15.2705078125, -14.80419921875, -14.337890625, -13.87158203125, -13.4052734375, -12.93896484375, -12.47265625, -12.00634765625, -11.5400390625, -11.07373046875, -10.607421875, -10.14111328125, -9.6748046875, -9.20849609375, -8.7421875, -8.27587890625, -7.8095703125, -7.34326171875, -6.876953125, -6.41064453125, -5.9443359375, -5.47802734375, -5.01171875, -4.54541015625, -4.0791015625, -3.61279296875, -3.146484375, -2.68017578125, -2.2138671875, -1.74755859375, -1.28125, -0.81494140625, -0.3486328125, 0.11767578125, 0.583984375, 1.05029296875, 1.5166015625, 1.98291015625, 2.44921875, 2.91552734375, 3.3818359375, 3.84814453125, 4.314453125, 4.78076171875, 5.2470703125, 5.71337890625, 6.1796875, 6.64599609375, 7.1123046875, 7.57861328125, 8.044921875, 8.51123046875, 8.9775390625, 9.44384765625, 9.91015625, 10.37646484375, 10.8427734375, 11.30908203125, 11.775390625, 12.24169921875, 12.7080078125, 13.17431640625, 13.640625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 8.0, 14.0, 30.0, 31.0, 33.0, 49.0, 70.0, 74.0, 78.0, 89.0, 97.0, 91.0, 75.0, 46.0, 63.0, 51.0, 42.0, 24.0, 16.0, 12.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.342891693115234, -22.248775482177734, -21.1546573638916, -20.0605411529541, -18.96642303466797, -17.87230682373047, -16.77819061279297, -15.684073448181152, -14.589956283569336, -13.49583911895752, -12.401721954345703, -11.307605743408203, -10.213488578796387, -9.11937141418457, -8.02525520324707, -6.931138038635254, -5.8370208740234375, -4.742903709411621, -3.648787021636963, -2.5546700954437256, -1.4605531692504883, -0.3664360046386719, 0.7276806831359863, 1.8217973709106445, 2.915914535522461, 4.010031700134277, 5.1041483879089355, 6.198265075683594, 7.29238224029541, 8.386499404907227, 9.480615615844727, 10.574732780456543, 11.668853759765625, 12.762970924377441, 13.857088088989258, 14.951204299926758, 16.04532241821289, 17.13943862915039, 18.23355484008789, 19.32767105102539, 20.421789169311523, 21.515905380249023, 22.610023498535156, 23.704139709472656, 24.798255920410156, 25.89237403869629, 26.98649024963379, 28.080608367919922, 29.174724578857422, 30.268840789794922, 31.362958908081055, 32.45707702636719, 33.55119323730469, 34.64530944824219, 35.73942565917969, 36.83354187011719, 37.92765808105469, 39.02177429199219, 40.11589050292969, 41.21001052856445, 42.30412673950195, 43.39824295043945, 44.49235916137695, 45.58647537231445, 46.68059539794922]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 4.0, 8.0, 6.0, 16.0, 11.0, 24.0, 11.0, 16.0, 21.0, 20.0, 24.0, 23.0, 24.0, 32.0, 32.0, 42.0, 38.0, 32.0, 40.0, 38.0, 43.0, 46.0, 45.0, 42.0, 28.0, 41.0, 34.0, 35.0, 30.0, 26.0, 24.0, 23.0, 20.0, 13.0, 14.0, 10.0, 10.0, 9.0, 7.0, 5.0, 9.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-23.922035217285156, -23.244312286376953, -22.56658935546875, -21.888866424560547, -21.211143493652344, -20.53342056274414, -19.855697631835938, -19.177974700927734, -18.50025177001953, -17.822528839111328, -17.144805908203125, -16.467082977294922, -15.789360046386719, -15.111637115478516, -14.433913230895996, -13.756190299987793, -13.078466415405273, -12.40074348449707, -11.723020553588867, -11.045297622680664, -10.367574691772461, -9.689851760864258, -9.012127876281738, -8.334404945373535, -7.656682014465332, -6.978959083557129, -6.301236152648926, -5.6235127449035645, -4.945789813995361, -4.268066883087158, -3.590343475341797, -2.9126205444335938, -2.2348976135253906, -1.557174563407898, -0.8794515132904053, -0.20172834396362305, 0.4759945869445801, 1.1537175178527832, 1.8314409255981445, 2.5091638565063477, 3.186886787414551, 3.864609718322754, 4.542332649230957, 5.220056056976318, 5.8977789878845215, 6.575501918792725, 7.253225326538086, 7.930948257446289, 8.608671188354492, 9.286394119262695, 9.964117050170898, 10.641839981079102, 11.319562911987305, 11.997285842895508, 12.675009727478027, 13.35273265838623, 14.030455589294434, 14.708178520202637, 15.38590145111084, 16.06362533569336, 16.741348266601562, 17.419071197509766, 18.09679412841797, 18.774517059326172, 19.452239990234375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 6.0, 8.0, 10.0, 14.0, 20.0, 17.0, 17.0, 20.0, 15.0, 29.0, 31.0, 26.0, 34.0, 35.0, 40.0, 41.0, 38.0, 41.0, 38.0, 49.0, 54.0, 35.0, 33.0, 32.0, 34.0, 37.0, 25.0, 26.0, 22.0, 22.0, 28.0, 21.0, 11.0, 15.0, 16.0, 8.0, 14.0, 4.0, 7.0, 3.0, 6.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.244140625, -2.17034912109375, -2.0965576171875, -2.02276611328125, -1.948974609375, -1.87518310546875, -1.8013916015625, -1.72760009765625, -1.65380859375, -1.58001708984375, -1.5062255859375, -1.43243408203125, -1.358642578125, -1.28485107421875, -1.2110595703125, -1.13726806640625, -1.0634765625, -0.98968505859375, -0.9158935546875, -0.84210205078125, -0.768310546875, -0.69451904296875, -0.6207275390625, -0.54693603515625, -0.47314453125, -0.39935302734375, -0.3255615234375, -0.25177001953125, -0.177978515625, -0.10418701171875, -0.0303955078125, 0.04339599609375, 0.1171875, 0.19097900390625, 0.2647705078125, 0.33856201171875, 0.412353515625, 0.48614501953125, 0.5599365234375, 0.63372802734375, 0.70751953125, 0.78131103515625, 0.8551025390625, 0.92889404296875, 1.002685546875, 1.07647705078125, 1.1502685546875, 1.22406005859375, 1.2978515625, 1.37164306640625, 1.4454345703125, 1.51922607421875, 1.593017578125, 1.66680908203125, 1.7406005859375, 1.81439208984375, 1.88818359375, 1.96197509765625, 2.0357666015625, 2.10955810546875, 2.183349609375, 2.25714111328125, 2.3309326171875, 2.40472412109375, 2.478515625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 3.0, 10.0, 11.0, 16.0, 18.0, 32.0, 57.0, 80.0, 113.0, 147.0, 190.0, 278.0, 456.0, 674.0, 912.0, 1361.0, 1906.0, 2867.0, 3986.0, 5510.0, 8160.0, 11392.0, 16915.0, 24936.0, 38675.0, 61387.0, 106334.0, 283737.0, 216191.0, 95247.0, 56492.0, 35411.0, 23418.0, 15593.0, 10927.0, 7636.0, 5201.0, 3732.0, 2578.0, 1752.0, 1260.0, 893.0, 632.0, 461.0, 294.0, 200.0, 155.0, 103.0, 75.0, 46.0, 39.0, 18.0, 18.0, 10.0, 9.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-0.1768798828125, -0.17133712768554688, -0.16579437255859375, -0.16025161743164062, -0.1547088623046875, -0.14916610717773438, -0.14362335205078125, -0.13808059692382812, -0.132537841796875, -0.12699508666992188, -0.12145233154296875, -0.11590957641601562, -0.1103668212890625, -0.10482406616210938, -0.09928131103515625, -0.09373855590820312, -0.08819580078125, -0.08265304565429688, -0.07711029052734375, -0.07156753540039062, -0.0660247802734375, -0.060482025146484375, -0.05493927001953125, -0.049396514892578125, -0.043853759765625, -0.038311004638671875, -0.03276824951171875, -0.027225494384765625, -0.0216827392578125, -0.016139984130859375, -0.01059722900390625, -0.005054473876953125, 0.00048828125, 0.006031036376953125, 0.01157379150390625, 0.017116546630859375, 0.0226593017578125, 0.028202056884765625, 0.03374481201171875, 0.039287567138671875, 0.044830322265625, 0.050373077392578125, 0.05591583251953125, 0.061458587646484375, 0.0670013427734375, 0.07254409790039062, 0.07808685302734375, 0.08362960815429688, 0.08917236328125, 0.09471511840820312, 0.10025787353515625, 0.10580062866210938, 0.1113433837890625, 0.11688613891601562, 0.12242889404296875, 0.12797164916992188, 0.133514404296875, 0.13905715942382812, 0.14459991455078125, 0.15014266967773438, 0.1556854248046875, 0.16122817993164062, 0.16677093505859375, 0.17231369018554688, 0.1778564453125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 1.0, 3.0, 13.0, 10.0, 9.0, 7.0, 8.0, 15.0, 15.0, 18.0, 18.0, 24.0, 18.0, 27.0, 26.0, 34.0, 26.0, 31.0, 38.0, 26.0, 41.0, 42.0, 1067.0, 34.0, 38.0, 38.0, 43.0, 33.0, 39.0, 34.0, 27.0, 23.0, 22.0, 37.0, 13.0, 26.0, 19.0, 22.0, 14.0, 5.0, 8.0, 6.0, 4.0, 6.0, 1.0, 5.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.7744140625, -1.721649169921875, -1.66888427734375, -1.616119384765625, -1.5633544921875, -1.510589599609375, -1.45782470703125, -1.405059814453125, -1.352294921875, -1.299530029296875, -1.24676513671875, -1.194000244140625, -1.1412353515625, -1.088470458984375, -1.03570556640625, -0.982940673828125, -0.93017578125, -0.877410888671875, -0.82464599609375, -0.771881103515625, -0.7191162109375, -0.666351318359375, -0.61358642578125, -0.560821533203125, -0.508056640625, -0.455291748046875, -0.40252685546875, -0.349761962890625, -0.2969970703125, -0.244232177734375, -0.19146728515625, -0.138702392578125, -0.0859375, -0.033172607421875, 0.01959228515625, 0.072357177734375, 0.1251220703125, 0.177886962890625, 0.23065185546875, 0.283416748046875, 0.336181640625, 0.388946533203125, 0.44171142578125, 0.494476318359375, 0.5472412109375, 0.600006103515625, 0.65277099609375, 0.705535888671875, 0.75830078125, 0.811065673828125, 0.86383056640625, 0.916595458984375, 0.9693603515625, 1.022125244140625, 1.07489013671875, 1.127655029296875, 1.180419921875, 1.233184814453125, 1.28594970703125, 1.338714599609375, 1.3914794921875, 1.444244384765625, 1.49700927734375, 1.549774169921875, 1.6025390625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 12.0, 16.0, 23.0, 39.0, 57.0, 71.0, 91.0, 156.0, 229.0, 307.0, 426.0, 683.0, 927.0, 1397.0, 2038.0, 3054.0, 4560.0, 7022.0, 10734.0, 16953.0, 27272.0, 45428.0, 82090.0, 172746.0, 1406647.0, 137524.0, 69660.0, 39766.0, 23848.0, 14798.0, 9521.0, 6147.0, 4197.0, 2763.0, 1793.0, 1291.0, 877.0, 582.0, 444.0, 286.0, 201.0, 138.0, 90.0, 66.0, 57.0, 28.0, 15.0, 22.0, 16.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1068115234375, -0.10329437255859375, -0.0997772216796875, -0.09626007080078125, -0.092742919921875, -0.08922576904296875, -0.0857086181640625, -0.08219146728515625, -0.07867431640625, -0.07515716552734375, -0.0716400146484375, -0.06812286376953125, -0.064605712890625, -0.06108856201171875, -0.0575714111328125, -0.05405426025390625, -0.050537109375, -0.04701995849609375, -0.0435028076171875, -0.03998565673828125, -0.036468505859375, -0.03295135498046875, -0.0294342041015625, -0.02591705322265625, -0.02239990234375, -0.01888275146484375, -0.0153656005859375, -0.01184844970703125, -0.008331298828125, -0.00481414794921875, -0.0012969970703125, 0.00222015380859375, 0.0057373046875, 0.00925445556640625, 0.0127716064453125, 0.01628875732421875, 0.019805908203125, 0.02332305908203125, 0.0268402099609375, 0.03035736083984375, 0.03387451171875, 0.03739166259765625, 0.0409088134765625, 0.04442596435546875, 0.047943115234375, 0.05146026611328125, 0.0549774169921875, 0.05849456787109375, 0.06201171875, 0.06552886962890625, 0.0690460205078125, 0.07256317138671875, 0.076080322265625, 0.07959747314453125, 0.0831146240234375, 0.08663177490234375, 0.09014892578125, 0.09366607666015625, 0.0971832275390625, 0.10070037841796875, 0.104217529296875, 0.10773468017578125, 0.1112518310546875, 0.11476898193359375, 0.1182861328125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 9.0, 9.0, 6.0, 11.0, 12.0, 13.0, 27.0, 36.0, 65.0, 140.0, 168.0, 166.0, 122.0, 55.0, 42.0, 23.0, 14.0, 9.0, 11.0, 5.0, 5.0, 13.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.811981201171875e-05, -1.744832843542099e-05, -1.677684485912323e-05, -1.610536128282547e-05, -1.543387770652771e-05, -1.476239413022995e-05, -1.409091055393219e-05, -1.341942697763443e-05, -1.274794340133667e-05, -1.207645982503891e-05, -1.140497624874115e-05, -1.073349267244339e-05, -1.006200909614563e-05, -9.39052551984787e-06, -8.71904194355011e-06, -8.04755836725235e-06, -7.37607479095459e-06, -6.70459121465683e-06, -6.03310763835907e-06, -5.36162406206131e-06, -4.69014048576355e-06, -4.01865690946579e-06, -3.3471733331680298e-06, -2.6756897568702698e-06, -2.0042061805725098e-06, -1.3327226042747498e-06, -6.612390279769897e-07, 1.0244548320770264e-08, 6.817281246185303e-07, 1.3532117009162903e-06, 2.0246952772140503e-06, 2.6961788535118103e-06, 3.3676624298095703e-06, 4.03914600610733e-06, 4.71062958240509e-06, 5.38211315870285e-06, 6.05359673500061e-06, 6.72508031129837e-06, 7.39656388759613e-06, 8.06804746389389e-06, 8.73953104019165e-06, 9.41101461648941e-06, 1.008249819278717e-05, 1.075398176908493e-05, 1.142546534538269e-05, 1.209694892168045e-05, 1.276843249797821e-05, 1.343991607427597e-05, 1.411139965057373e-05, 1.478288322687149e-05, 1.545436680316925e-05, 1.612585037946701e-05, 1.679733395576477e-05, 1.746881753206253e-05, 1.814030110836029e-05, 1.881178468465805e-05, 1.948326826095581e-05, 2.015475183725357e-05, 2.082623541355133e-05, 2.149771898984909e-05, 2.216920256614685e-05, 2.284068614244461e-05, 2.351216971874237e-05, 2.418365329504013e-05, 2.485513687133789e-05]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 6.0, 0.0, 1.0, 7.0, 8.0, 8.0, 9.0, 18.0, 16.0, 18.0, 24.0, 31.0, 53.0, 69.0, 108.0, 194.0, 595.0, 4616.0, 54506.0, 847432.0, 130043.0, 9025.0, 1102.0, 249.0, 118.0, 75.0, 50.0, 41.0, 23.0, 23.0, 20.0, 15.0, 7.0, 11.0, 12.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.000324249267578125, -0.00031563639640808105, -0.0003070235252380371, -0.00029841065406799316, -0.0002897977828979492, -0.0002811849117279053, -0.00027257204055786133, -0.0002639591693878174, -0.00025534629821777344, -0.0002467334270477295, -0.00023812055587768555, -0.0002295076847076416, -0.00022089481353759766, -0.0002122819423675537, -0.00020366907119750977, -0.00019505620002746582, -0.00018644332885742188, -0.00017783045768737793, -0.00016921758651733398, -0.00016060471534729004, -0.0001519918441772461, -0.00014337897300720215, -0.0001347661018371582, -0.00012615323066711426, -0.00011754035949707031, -0.00010892748832702637, -0.00010031461715698242, -9.170174598693848e-05, -8.308887481689453e-05, -7.447600364685059e-05, -6.586313247680664e-05, -5.7250261306762695e-05, -4.863739013671875e-05, -4.0024518966674805e-05, -3.141164779663086e-05, -2.2798776626586914e-05, -1.4185905456542969e-05, -5.5730342864990234e-06, 3.039836883544922e-06, 1.1652708053588867e-05, 2.0265579223632812e-05, 2.8878450393676758e-05, 3.74913215637207e-05, 4.610419273376465e-05, 5.4717063903808594e-05, 6.332993507385254e-05, 7.194280624389648e-05, 8.055567741394043e-05, 8.916854858398438e-05, 9.778141975402832e-05, 0.00010639429092407227, 0.00011500716209411621, 0.00012362003326416016, 0.0001322329044342041, 0.00014084577560424805, 0.000149458646774292, 0.00015807151794433594, 0.00016668438911437988, 0.00017529726028442383, 0.00018391013145446777, 0.00019252300262451172, 0.00020113587379455566, 0.0002097487449645996, 0.00021836161613464355, 0.0002269744873046875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 16.0, 13.0, 26.0, 49.0, 57.0, 102.0, 150.0, 175.0, 163.0, 95.0, 61.0, 44.0, 14.0, 12.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0653802494052798e-05, -1.990055534406565e-05, -1.9147308194078505e-05, -1.839406104409136e-05, -1.7640815713093616e-05, -1.688756856310647e-05, -1.6134321413119324e-05, -1.5381074263132177e-05, -1.4627828022639733e-05, -1.3874580872652587e-05, -1.3121334632160142e-05, -1.2368087482172996e-05, -1.161484033218585e-05, -1.0861594091693405e-05, -1.0108346941706259e-05, -9.355100701213814e-06, -8.601853551226668e-06, -7.848606401239522e-06, -7.095360160747077e-06, -6.342113010759931e-06, -5.588866315520136e-06, -4.83561962028034e-06, -4.082372470293194e-06, -3.3291257750533987e-06, -2.5758790798136033e-06, -1.8226322708869702e-06, -1.0693854619603371e-06, -3.161385393468663e-07, 4.3710815589292906e-07, 1.1903548511327244e-06, 1.9436020011198707e-06, 2.696848696359666e-06, 3.450097210588865e-06, 4.20334390582866e-06, 4.956590601068456e-06, 5.709837751055602e-06, 6.463084446295397e-06, 7.216331141535193e-06, 7.969578291522339e-06, 8.722825441509485e-06, 9.47607168200193e-06, 1.0229318831989076e-05, 1.098256507248152e-05, 1.1735812222468667e-05, 1.2489059372455813e-05, 1.3242305612948257e-05, 1.3995552762935404e-05, 1.4748799003427848e-05, 1.5502046153414994e-05, 1.625529330340214e-05, 1.7008540453389287e-05, 1.7761787603376433e-05, 1.8515032934374176e-05, 1.9268280084361322e-05, 2.002152723434847e-05, 2.0774774384335615e-05, 2.1528019715333357e-05, 2.2281266865320504e-05, 2.303451401530765e-05, 2.3787761165294796e-05, 2.454100649629254e-05, 2.5294253646279685e-05, 2.604750079626683e-05, 2.6800747946253978e-05, 2.7553995096241124e-05]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 8.0, 5.0, 19.0, 17.0, 12.0, 12.0, 24.0, 27.0, 32.0, 26.0, 34.0, 35.0, 41.0, 32.0, 41.0, 41.0, 56.0, 65.0, 38.0, 37.0, 35.0, 41.0, 57.0, 46.0, 39.0, 28.0, 30.0, 20.0, 19.0, 10.0, 16.0, 14.0, 12.0, 6.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.119510650634766e-06, -8.809380233287811e-06, -8.499249815940857e-06, -8.189119398593903e-06, -7.878988981246948e-06, -7.568858563899994e-06, -7.2587281465530396e-06, -6.948597729206085e-06, -6.638467311859131e-06, -6.3283368945121765e-06, -6.018206477165222e-06, -5.708076059818268e-06, -5.3979456424713135e-06, -5.087815225124359e-06, -4.777684807777405e-06, -4.4675543904304504e-06, -4.157423973083496e-06, -3.847293555736542e-06, -3.5371631383895874e-06, -3.227032721042633e-06, -2.9169023036956787e-06, -2.6067718863487244e-06, -2.29664146900177e-06, -1.9865110516548157e-06, -1.6763806343078613e-06, -1.366250216960907e-06, -1.0561197996139526e-06, -7.459893822669983e-07, -4.3585896492004395e-07, -1.257285475730896e-07, 1.8440186977386475e-07, 4.945322871208191e-07, 8.046627044677734e-07, 1.1147931218147278e-06, 1.4249235391616821e-06, 1.7350539565086365e-06, 2.045184373855591e-06, 2.355314791202545e-06, 2.6654452085494995e-06, 2.975575625896454e-06, 3.285706043243408e-06, 3.5958364605903625e-06, 3.905966877937317e-06, 4.216097295284271e-06, 4.526227712631226e-06, 4.83635812997818e-06, 5.146488547325134e-06, 5.456618964672089e-06, 5.766749382019043e-06, 6.076879799365997e-06, 6.387010216712952e-06, 6.697140634059906e-06, 7.00727105140686e-06, 7.317401468753815e-06, 7.627531886100769e-06, 7.937662303447723e-06, 8.247792720794678e-06, 8.557923138141632e-06, 8.868053555488586e-06, 9.17818397283554e-06, 9.488314390182495e-06, 9.79844480752945e-06, 1.0108575224876404e-05, 1.0418705642223358e-05, 1.0728836059570312e-05]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 6.0, 8.0, 10.0, 14.0, 20.0, 17.0, 17.0, 20.0, 15.0, 29.0, 31.0, 26.0, 34.0, 35.0, 40.0, 41.0, 38.0, 41.0, 38.0, 49.0, 54.0, 35.0, 33.0, 32.0, 34.0, 37.0, 25.0, 26.0, 22.0, 22.0, 28.0, 21.0, 11.0, 15.0, 16.0, 8.0, 14.0, 4.0, 7.0, 3.0, 6.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.244140625, -2.17034912109375, -2.0965576171875, -2.02276611328125, -1.948974609375, -1.87518310546875, -1.8013916015625, -1.72760009765625, -1.65380859375, -1.58001708984375, -1.5062255859375, -1.43243408203125, -1.358642578125, -1.28485107421875, -1.2110595703125, -1.13726806640625, -1.0634765625, -0.98968505859375, -0.9158935546875, -0.84210205078125, -0.768310546875, -0.69451904296875, -0.6207275390625, -0.54693603515625, -0.47314453125, -0.39935302734375, -0.3255615234375, -0.25177001953125, -0.177978515625, -0.10418701171875, -0.0303955078125, 0.04339599609375, 0.1171875, 0.19097900390625, 0.2647705078125, 0.33856201171875, 0.412353515625, 0.48614501953125, 0.5599365234375, 0.63372802734375, 0.70751953125, 0.78131103515625, 0.8551025390625, 0.92889404296875, 1.002685546875, 1.07647705078125, 1.1502685546875, 1.22406005859375, 1.2978515625, 1.37164306640625, 1.4454345703125, 1.51922607421875, 1.593017578125, 1.66680908203125, 1.7406005859375, 1.81439208984375, 1.88818359375, 1.96197509765625, 2.0357666015625, 2.10955810546875, 2.183349609375, 2.25714111328125, 2.3309326171875, 2.40472412109375, 2.478515625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 9.0, 10.0, 14.0, 27.0, 42.0, 87.0, 144.0, 223.0, 433.0, 765.0, 1450.0, 2560.0, 4899.0, 9555.0, 19117.0, 43607.0, 110221.0, 343579.0, 324576.0, 106478.0, 42023.0, 19074.0, 9307.0, 4790.0, 2602.0, 1374.0, 687.0, 344.0, 209.0, 121.0, 82.0, 53.0, 29.0, 24.0, 14.0, 8.0, 3.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55859375, -2.4561767578125, -2.353759765625, -2.2513427734375, -2.14892578125, -2.0465087890625, -1.944091796875, -1.8416748046875, -1.7392578125, -1.6368408203125, -1.534423828125, -1.4320068359375, -1.32958984375, -1.2271728515625, -1.124755859375, -1.0223388671875, -0.919921875, -0.8175048828125, -0.715087890625, -0.6126708984375, -0.51025390625, -0.4078369140625, -0.305419921875, -0.2030029296875, -0.1005859375, 0.0018310546875, 0.104248046875, 0.2066650390625, 0.30908203125, 0.4114990234375, 0.513916015625, 0.6163330078125, 0.71875, 0.8211669921875, 0.923583984375, 1.0260009765625, 1.12841796875, 1.2308349609375, 1.333251953125, 1.4356689453125, 1.5380859375, 1.6405029296875, 1.742919921875, 1.8453369140625, 1.94775390625, 2.0501708984375, 2.152587890625, 2.2550048828125, 2.357421875, 2.4598388671875, 2.562255859375, 2.6646728515625, 2.76708984375, 2.8695068359375, 2.971923828125, 3.0743408203125, 3.1767578125, 3.2791748046875, 3.381591796875, 3.4840087890625, 3.58642578125, 3.6888427734375, 3.791259765625, 3.8936767578125, 3.99609375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 9.0, 8.0, 11.0, 13.0, 12.0, 16.0, 13.0, 19.0, 25.0, 28.0, 31.0, 37.0, 46.0, 47.0, 59.0, 59.0, 91.0, 183.0, 1632.0, 169.0, 78.0, 65.0, 51.0, 46.0, 41.0, 27.0, 34.0, 33.0, 24.0, 20.0, 18.0, 19.0, 14.0, 12.0, 9.0, 10.0, 5.0, 4.0, 3.0, 2.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-8.8203125, -8.5484619140625, -8.276611328125, -8.0047607421875, -7.73291015625, -7.4610595703125, -7.189208984375, -6.9173583984375, -6.6455078125, -6.3736572265625, -6.101806640625, -5.8299560546875, -5.55810546875, -5.2862548828125, -5.014404296875, -4.7425537109375, -4.470703125, -4.1988525390625, -3.927001953125, -3.6551513671875, -3.38330078125, -3.1114501953125, -2.839599609375, -2.5677490234375, -2.2958984375, -2.0240478515625, -1.752197265625, -1.4803466796875, -1.20849609375, -0.9366455078125, -0.664794921875, -0.3929443359375, -0.12109375, 0.1507568359375, 0.422607421875, 0.6944580078125, 0.96630859375, 1.2381591796875, 1.510009765625, 1.7818603515625, 2.0537109375, 2.3255615234375, 2.597412109375, 2.8692626953125, 3.14111328125, 3.4129638671875, 3.684814453125, 3.9566650390625, 4.228515625, 4.5003662109375, 4.772216796875, 5.0440673828125, 5.31591796875, 5.5877685546875, 5.859619140625, 6.1314697265625, 6.4033203125, 6.6751708984375, 6.947021484375, 7.2188720703125, 7.49072265625, 7.7625732421875, 8.034423828125, 8.3062744140625, 8.578125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 3.0, 9.0, 12.0, 13.0, 18.0, 24.0, 18.0, 38.0, 38.0, 74.0, 71.0, 104.0, 136.0, 242.0, 387.0, 867.0, 2978.0, 18669.0, 302971.0, 2736681.0, 71396.0, 7719.0, 1577.0, 622.0, 319.0, 190.0, 133.0, 92.0, 72.0, 44.0, 36.0, 25.0, 21.0, 14.0, 19.0, 13.0, 7.0, 15.0, 6.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-13.375, -12.9473876953125, -12.519775390625, -12.0921630859375, -11.66455078125, -11.2369384765625, -10.809326171875, -10.3817138671875, -9.9541015625, -9.5264892578125, -9.098876953125, -8.6712646484375, -8.24365234375, -7.8160400390625, -7.388427734375, -6.9608154296875, -6.533203125, -6.1055908203125, -5.677978515625, -5.2503662109375, -4.82275390625, -4.3951416015625, -3.967529296875, -3.5399169921875, -3.1123046875, -2.6846923828125, -2.257080078125, -1.8294677734375, -1.40185546875, -0.9742431640625, -0.546630859375, -0.1190185546875, 0.30859375, 0.7362060546875, 1.163818359375, 1.5914306640625, 2.01904296875, 2.4466552734375, 2.874267578125, 3.3018798828125, 3.7294921875, 4.1571044921875, 4.584716796875, 5.0123291015625, 5.43994140625, 5.8675537109375, 6.295166015625, 6.7227783203125, 7.150390625, 7.5780029296875, 8.005615234375, 8.4332275390625, 8.86083984375, 9.2884521484375, 9.716064453125, 10.1436767578125, 10.5712890625, 10.9989013671875, 11.426513671875, 11.8541259765625, 12.28173828125, 12.7093505859375, 13.136962890625, 13.5645751953125, 13.9921875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [5.0, 68.0, 645.0, 289.0, 13.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.742936134338379, -6.887946128845215, -3.032956123352051, 0.8220338821411133, 4.677023887634277, 8.532013893127441, 12.387003898620605, 16.241992950439453, 20.09698486328125, 23.951974868774414, 27.806964874267578, 31.661954879760742, 35.516944885253906, 39.37193298339844, 43.226924896240234, 47.08191680908203, 50.93690490722656, 54.791893005371094, 58.64688491821289, 62.50187683105469, 66.35686492919922, 70.21185302734375, 74.06684875488281, 77.92183685302734, 81.77682495117188, 85.6318130493164, 89.48680114746094, 93.341796875, 97.19678497314453, 101.05177307128906, 104.90676879882812, 108.76175689697266, 112.61674499511719, 116.47173309326172, 120.32672119140625, 124.18171691894531, 128.03671264648438, 131.89169311523438, 135.74668884277344, 139.60166931152344, 143.4566650390625, 147.31166076660156, 151.16664123535156, 155.02163696289062, 158.87661743164062, 162.7316131591797, 166.58660888671875, 170.44158935546875, 174.2965850830078, 178.15158081054688, 182.00656127929688, 185.86155700683594, 189.716552734375, 193.571533203125, 197.42652893066406, 201.28150939941406, 205.13650512695312, 208.9915008544922, 212.8464813232422, 216.70147705078125, 220.55645751953125, 224.4114532470703, 228.26644897460938, 232.12142944335938, 235.97642517089844]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 7.0, 10.0, 15.0, 11.0, 6.0, 23.0, 12.0, 21.0, 26.0, 40.0, 24.0, 28.0, 51.0, 34.0, 48.0, 48.0, 36.0, 46.0, 41.0, 38.0, 38.0, 33.0, 37.0, 45.0, 37.0, 33.0, 26.0, 27.0, 25.0, 21.0, 19.0, 18.0, 6.0, 15.0, 12.0, 7.0, 2.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.223691940307617, -24.327669143676758, -23.4316463470459, -22.53562355041504, -21.639598846435547, -20.743576049804688, -19.847553253173828, -18.95153045654297, -18.05550765991211, -17.15948486328125, -16.26346206665039, -15.367438316345215, -14.471415519714355, -13.575392723083496, -12.67936897277832, -11.783346176147461, -10.887323379516602, -9.991300582885742, -9.095277786254883, -8.199254035949707, -7.303231239318848, -6.407208442687988, -5.511185169219971, -4.615161895751953, -3.7191390991210938, -2.8231160640716553, -1.9270930290222168, -1.0310699939727783, -0.13504695892333984, 0.7609758377075195, 1.656999111175537, 2.5530223846435547, 3.4490432739257812, 4.345066070556641, 5.241089344024658, 6.137112617492676, 7.033135414123535, 7.9291582107543945, 8.82518196105957, 9.72120475769043, 10.617227554321289, 11.513250350952148, 12.409273147583008, 13.305296897888184, 14.201319694519043, 15.097342491149902, 15.993366241455078, 16.889389038085938, 17.785411834716797, 18.681434631347656, 19.577457427978516, 20.473480224609375, 21.369503021240234, 22.265525817871094, 23.161550521850586, 24.057573318481445, 24.953596115112305, 25.849618911743164, 26.745641708374023, 27.641664505004883, 28.537689208984375, 29.433712005615234, 30.329734802246094, 31.225757598876953, 32.12178039550781]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 7.0, 3.0, 9.0, 9.0, 10.0, 18.0, 12.0, 20.0, 16.0, 20.0, 16.0, 32.0, 23.0, 23.0, 39.0, 37.0, 36.0, 25.0, 44.0, 40.0, 43.0, 44.0, 45.0, 46.0, 31.0, 22.0, 38.0, 29.0, 33.0, 26.0, 29.0, 23.0, 15.0, 17.0, 28.0, 14.0, 9.0, 12.0, 18.0, 11.0, 3.0, 6.0, 4.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.302734375, -2.23004150390625, -2.1573486328125, -2.08465576171875, -2.011962890625, -1.93927001953125, -1.8665771484375, -1.79388427734375, -1.72119140625, -1.64849853515625, -1.5758056640625, -1.50311279296875, -1.430419921875, -1.35772705078125, -1.2850341796875, -1.21234130859375, -1.1396484375, -1.06695556640625, -0.9942626953125, -0.92156982421875, -0.848876953125, -0.77618408203125, -0.7034912109375, -0.63079833984375, -0.55810546875, -0.48541259765625, -0.4127197265625, -0.34002685546875, -0.267333984375, -0.19464111328125, -0.1219482421875, -0.04925537109375, 0.0234375, 0.09613037109375, 0.1688232421875, 0.24151611328125, 0.314208984375, 0.38690185546875, 0.4595947265625, 0.53228759765625, 0.60498046875, 0.67767333984375, 0.7503662109375, 0.82305908203125, 0.895751953125, 0.96844482421875, 1.0411376953125, 1.11383056640625, 1.1865234375, 1.25921630859375, 1.3319091796875, 1.40460205078125, 1.477294921875, 1.54998779296875, 1.6226806640625, 1.69537353515625, 1.76806640625, 1.84075927734375, 1.9134521484375, 1.98614501953125, 2.058837890625, 2.13153076171875, 2.2042236328125, 2.27691650390625, 2.349609375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 10.0, 20.0, 34.0, 44.0, 76.0, 97.0, 182.0, 239.0, 409.0, 715.0, 1208.0, 2248.0, 4350.0, 8919.0, 19510.0, 47338.0, 132411.0, 484775.0, 1917832.0, 1175895.0, 256650.0, 81484.0, 31940.0, 13784.0, 6587.0, 3274.0, 1765.0, 967.0, 567.0, 319.0, 201.0, 141.0, 81.0, 66.0, 43.0, 28.0, 22.0, 13.0, 9.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.728515625, -3.583892822265625, -3.43927001953125, -3.294647216796875, -3.1500244140625, -3.005401611328125, -2.86077880859375, -2.716156005859375, -2.571533203125, -2.426910400390625, -2.28228759765625, -2.137664794921875, -1.9930419921875, -1.848419189453125, -1.70379638671875, -1.559173583984375, -1.41455078125, -1.269927978515625, -1.12530517578125, -0.980682373046875, -0.8360595703125, -0.691436767578125, -0.54681396484375, -0.402191162109375, -0.257568359375, -0.112945556640625, 0.03167724609375, 0.176300048828125, 0.3209228515625, 0.465545654296875, 0.61016845703125, 0.754791259765625, 0.8994140625, 1.044036865234375, 1.18865966796875, 1.333282470703125, 1.4779052734375, 1.622528076171875, 1.76715087890625, 1.911773681640625, 2.056396484375, 2.201019287109375, 2.34564208984375, 2.490264892578125, 2.6348876953125, 2.779510498046875, 2.92413330078125, 3.068756103515625, 3.21337890625, 3.358001708984375, 3.50262451171875, 3.647247314453125, 3.7918701171875, 3.936492919921875, 4.08111572265625, 4.225738525390625, 4.370361328125, 4.514984130859375, 4.65960693359375, 4.804229736328125, 4.9488525390625, 5.093475341796875, 5.23809814453125, 5.382720947265625, 5.52734375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 13.0, 16.0, 25.0, 43.0, 93.0, 189.0, 328.0, 527.0, 940.0, 809.0, 487.0, 258.0, 149.0, 91.0, 50.0, 25.0, 8.0, 13.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.9296875, -15.5396728515625, -15.149658203125, -14.7596435546875, -14.36962890625, -13.9796142578125, -13.589599609375, -13.1995849609375, -12.8095703125, -12.4195556640625, -12.029541015625, -11.6395263671875, -11.24951171875, -10.8594970703125, -10.469482421875, -10.0794677734375, -9.689453125, -9.2994384765625, -8.909423828125, -8.5194091796875, -8.12939453125, -7.7393798828125, -7.349365234375, -6.9593505859375, -6.5693359375, -6.1793212890625, -5.789306640625, -5.3992919921875, -5.00927734375, -4.6192626953125, -4.229248046875, -3.8392333984375, -3.44921875, -3.0592041015625, -2.669189453125, -2.2791748046875, -1.88916015625, -1.4991455078125, -1.109130859375, -0.7191162109375, -0.3291015625, 0.0609130859375, 0.450927734375, 0.8409423828125, 1.23095703125, 1.6209716796875, 2.010986328125, 2.4010009765625, 2.791015625, 3.1810302734375, 3.571044921875, 3.9610595703125, 4.35107421875, 4.7410888671875, 5.131103515625, 5.5211181640625, 5.9111328125, 6.3011474609375, 6.691162109375, 7.0811767578125, 7.47119140625, 7.8612060546875, 8.251220703125, 8.6412353515625, 9.03125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 10.0, 23.0, 14.0, 22.0, 48.0, 44.0, 60.0, 88.0, 126.0, 271.0, 571.0, 1938.0, 8077.0, 61024.0, 914612.0, 2991200.0, 191407.0, 19470.0, 3350.0, 973.0, 380.0, 215.0, 92.0, 66.0, 53.0, 46.0, 32.0, 18.0, 13.0, 7.0, 9.0, 6.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.953125, -16.392333984375, -15.83154296875, -15.270751953125, -14.7099609375, -14.149169921875, -13.58837890625, -13.027587890625, -12.466796875, -11.906005859375, -11.34521484375, -10.784423828125, -10.2236328125, -9.662841796875, -9.10205078125, -8.541259765625, -7.98046875, -7.419677734375, -6.85888671875, -6.298095703125, -5.7373046875, -5.176513671875, -4.61572265625, -4.054931640625, -3.494140625, -2.933349609375, -2.37255859375, -1.811767578125, -1.2509765625, -0.690185546875, -0.12939453125, 0.431396484375, 0.9921875, 1.552978515625, 2.11376953125, 2.674560546875, 3.2353515625, 3.796142578125, 4.35693359375, 4.917724609375, 5.478515625, 6.039306640625, 6.60009765625, 7.160888671875, 7.7216796875, 8.282470703125, 8.84326171875, 9.404052734375, 9.96484375, 10.525634765625, 11.08642578125, 11.647216796875, 12.2080078125, 12.768798828125, 13.32958984375, 13.890380859375, 14.451171875, 15.011962890625, 15.57275390625, 16.133544921875, 16.6943359375, 17.255126953125, 17.81591796875, 18.376708984375, 18.9375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 24.0, 50.0, 50.0, 66.0, 96.0, 131.0, 142.0, 122.0, 119.0, 66.0, 52.0, 35.0, 22.0, 11.0, 7.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-77.07830047607422, -75.45429992675781, -73.8302993774414, -72.206298828125, -70.5822982788086, -68.95829772949219, -67.33429718017578, -65.71029663085938, -64.08629608154297, -62.46229553222656, -60.838294982910156, -59.21429443359375, -57.590293884277344, -55.96629333496094, -54.34229278564453, -52.71828842163086, -51.09428405761719, -49.47028350830078, -47.846282958984375, -46.22228240966797, -44.59828186035156, -42.974281311035156, -41.35028076171875, -39.72627639770508, -38.10227966308594, -36.47827911376953, -34.854278564453125, -33.23027801513672, -31.60627555847168, -29.982275009155273, -28.358274459838867, -26.734272003173828, -25.110273361206055, -23.48627281188965, -21.862272262573242, -20.238269805908203, -18.614269256591797, -16.99026870727539, -15.366268157958984, -13.742266654968262, -12.118266105651855, -10.49426555633545, -8.870264053344727, -7.24626350402832, -5.622262477874756, -3.9982614517211914, -2.374260902404785, -0.7502593994140625, 0.8737411499023438, 2.497742176055908, 4.121743202209473, 5.745743751525879, 7.369744777679443, 8.993745803833008, 10.617746353149414, 12.241747856140137, 13.865748405456543, 15.48974895477295, 17.113750457763672, 18.737751007080078, 20.361751556396484, 21.98575210571289, 23.609752655029297, 25.233755111694336, 26.857755661010742]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 6.0, 9.0, 13.0, 8.0, 16.0, 26.0, 23.0, 29.0, 24.0, 30.0, 22.0, 32.0, 35.0, 30.0, 47.0, 39.0, 40.0, 48.0, 48.0, 38.0, 48.0, 49.0, 39.0, 40.0, 42.0, 29.0, 37.0, 27.0, 18.0, 17.0, 15.0, 7.0, 9.0, 14.0, 11.0, 8.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.792633056640625, -22.01926040649414, -21.24588966369629, -20.472517013549805, -19.699146270751953, -18.92577362060547, -18.152400970458984, -17.379030227661133, -16.60565757751465, -15.83228588104248, -15.058914184570312, -14.285541534423828, -13.51216983795166, -12.738798141479492, -11.965426445007324, -11.192054748535156, -10.418683052062988, -9.64531135559082, -8.871939659118652, -8.098567962646484, -7.3251953125, -6.551823616027832, -5.778451919555664, -5.005079746246338, -4.23170804977417, -3.458336114883423, -2.684964179992676, -1.9115924835205078, -1.1382205486297607, -0.36484861373901367, 0.4085230827331543, 1.1818952560424805, 1.9552669525146484, 2.7286388874053955, 3.5020108222961426, 4.2753825187683105, 5.048754692077637, 5.822126388549805, 6.595498085021973, 7.368870258331299, 8.142242431640625, 8.915614128112793, 9.688985824584961, 10.462358474731445, 11.235730171203613, 12.009101867675781, 12.78247356414795, 13.555845260620117, 14.329216957092285, 15.102588653564453, 15.875960350036621, 16.64933204650879, 17.422704696655273, 18.196075439453125, 18.96944808959961, 19.742820739746094, 20.516191482543945, 21.28956413269043, 22.06293487548828, 22.836307525634766, 23.609678268432617, 24.3830509185791, 25.156421661376953, 25.929794311523438, 26.703166961669922]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 4.0, 8.0, 16.0, 12.0, 14.0, 19.0, 26.0, 22.0, 17.0, 23.0, 26.0, 38.0, 35.0, 42.0, 49.0, 31.0, 50.0, 41.0, 51.0, 41.0, 42.0, 40.0, 31.0, 34.0, 28.0, 32.0, 25.0, 30.0, 27.0, 28.0, 17.0, 20.0, 12.0, 11.0, 14.0, 4.0, 6.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.583984375, -2.501953125, -2.419921875, -2.337890625, -2.255859375, -2.173828125, -2.091796875, -2.009765625, -1.927734375, -1.845703125, -1.763671875, -1.681640625, -1.599609375, -1.517578125, -1.435546875, -1.353515625, -1.271484375, -1.189453125, -1.107421875, -1.025390625, -0.943359375, -0.861328125, -0.779296875, -0.697265625, -0.615234375, -0.533203125, -0.451171875, -0.369140625, -0.287109375, -0.205078125, -0.123046875, -0.041015625, 0.041015625, 0.123046875, 0.205078125, 0.287109375, 0.369140625, 0.451171875, 0.533203125, 0.615234375, 0.697265625, 0.779296875, 0.861328125, 0.943359375, 1.025390625, 1.107421875, 1.189453125, 1.271484375, 1.353515625, 1.435546875, 1.517578125, 1.599609375, 1.681640625, 1.763671875, 1.845703125, 1.927734375, 2.009765625, 2.091796875, 2.173828125, 2.255859375, 2.337890625, 2.419921875, 2.501953125, 2.583984375, 2.666015625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 12.0, 13.0, 16.0, 24.0, 45.0, 58.0, 88.0, 141.0, 164.0, 237.0, 368.0, 490.0, 710.0, 1008.0, 1444.0, 2024.0, 2980.0, 4239.0, 6196.0, 9198.0, 13424.0, 20040.0, 30449.0, 48001.0, 80327.0, 152211.0, 327984.0, 137984.0, 75034.0, 45052.0, 29012.0, 18952.0, 12665.0, 8681.0, 5883.0, 4100.0, 2864.0, 1937.0, 1359.0, 967.0, 643.0, 472.0, 302.0, 232.0, 160.0, 107.0, 90.0, 53.0, 34.0, 33.0, 11.0, 12.0, 10.0, 9.0, 2.0, 4.0, 1.0, 3.0], "bins": [-0.1917724609375, -0.18585968017578125, -0.1799468994140625, -0.17403411865234375, -0.168121337890625, -0.16220855712890625, -0.1562957763671875, -0.15038299560546875, -0.14447021484375, -0.13855743408203125, -0.1326446533203125, -0.12673187255859375, -0.120819091796875, -0.11490631103515625, -0.1089935302734375, -0.10308074951171875, -0.09716796875, -0.09125518798828125, -0.0853424072265625, -0.07942962646484375, -0.073516845703125, -0.06760406494140625, -0.0616912841796875, -0.05577850341796875, -0.04986572265625, -0.04395294189453125, -0.0380401611328125, -0.03212738037109375, -0.026214599609375, -0.02030181884765625, -0.0143890380859375, -0.00847625732421875, -0.0025634765625, 0.00334930419921875, 0.0092620849609375, 0.01517486572265625, 0.021087646484375, 0.02700042724609375, 0.0329132080078125, 0.03882598876953125, 0.04473876953125, 0.05065155029296875, 0.0565643310546875, 0.06247711181640625, 0.068389892578125, 0.07430267333984375, 0.0802154541015625, 0.08612823486328125, 0.092041015625, 0.09795379638671875, 0.1038665771484375, 0.10977935791015625, 0.115692138671875, 0.12160491943359375, 0.1275177001953125, 0.13343048095703125, 0.13934326171875, 0.14525604248046875, 0.1511688232421875, 0.15708160400390625, 0.162994384765625, 0.16890716552734375, 0.1748199462890625, 0.18073272705078125, 0.1866455078125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 7.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 11.0, 11.0, 14.0, 12.0, 20.0, 13.0, 16.0, 12.0, 19.0, 28.0, 26.0, 28.0, 29.0, 24.0, 33.0, 45.0, 37.0, 45.0, 43.0, 1066.0, 36.0, 36.0, 36.0, 38.0, 42.0, 27.0, 34.0, 38.0, 28.0, 26.0, 14.0, 17.0, 22.0, 12.0, 16.0, 11.0, 7.0, 11.0, 7.0, 4.0, 6.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7294921875, -1.67449951171875, -1.6195068359375, -1.56451416015625, -1.509521484375, -1.45452880859375, -1.3995361328125, -1.34454345703125, -1.28955078125, -1.23455810546875, -1.1795654296875, -1.12457275390625, -1.069580078125, -1.01458740234375, -0.9595947265625, -0.90460205078125, -0.849609375, -0.79461669921875, -0.7396240234375, -0.68463134765625, -0.629638671875, -0.57464599609375, -0.5196533203125, -0.46466064453125, -0.40966796875, -0.35467529296875, -0.2996826171875, -0.24468994140625, -0.189697265625, -0.13470458984375, -0.0797119140625, -0.02471923828125, 0.0302734375, 0.08526611328125, 0.1402587890625, 0.19525146484375, 0.250244140625, 0.30523681640625, 0.3602294921875, 0.41522216796875, 0.47021484375, 0.52520751953125, 0.5802001953125, 0.63519287109375, 0.690185546875, 0.74517822265625, 0.8001708984375, 0.85516357421875, 0.91015625, 0.96514892578125, 1.0201416015625, 1.07513427734375, 1.130126953125, 1.18511962890625, 1.2401123046875, 1.29510498046875, 1.35009765625, 1.40509033203125, 1.4600830078125, 1.51507568359375, 1.570068359375, 1.62506103515625, 1.6800537109375, 1.73504638671875, 1.7900390625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 9.0, 17.0, 28.0, 26.0, 48.0, 61.0, 77.0, 134.0, 219.0, 284.0, 426.0, 631.0, 859.0, 1258.0, 1923.0, 2886.0, 4359.0, 6410.0, 10042.0, 15654.0, 25275.0, 42407.0, 75889.0, 161223.0, 1421032.0, 146990.0, 71522.0, 40126.0, 23801.0, 15030.0, 9473.0, 6227.0, 4179.0, 2721.0, 1857.0, 1273.0, 898.0, 587.0, 375.0, 279.0, 201.0, 121.0, 98.0, 69.0, 35.0, 32.0, 23.0, 13.0, 7.0, 5.0, 8.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1187744140625, -0.11511421203613281, -0.11145401000976562, -0.10779380798339844, -0.10413360595703125, -0.10047340393066406, -0.09681320190429688, -0.09315299987792969, -0.0894927978515625, -0.08583259582519531, -0.08217239379882812, -0.07851219177246094, -0.07485198974609375, -0.07119178771972656, -0.06753158569335938, -0.06387138366699219, -0.060211181640625, -0.05655097961425781, -0.052890777587890625, -0.04923057556152344, -0.04557037353515625, -0.04191017150878906, -0.038249969482421875, -0.03458976745605469, -0.0309295654296875, -0.027269363403320312, -0.023609161376953125, -0.019948959350585938, -0.01628875732421875, -0.012628555297851562, -0.008968353271484375, -0.0053081512451171875, -0.00164794921875, 0.0020122528076171875, 0.005672454833984375, 0.009332656860351562, 0.01299285888671875, 0.016653060913085938, 0.020313262939453125, 0.023973464965820312, 0.0276336669921875, 0.03129386901855469, 0.034954071044921875, 0.03861427307128906, 0.04227447509765625, 0.04593467712402344, 0.049594879150390625, 0.05325508117675781, 0.056915283203125, 0.06057548522949219, 0.06423568725585938, 0.06789588928222656, 0.07155609130859375, 0.07521629333496094, 0.07887649536132812, 0.08253669738769531, 0.0861968994140625, 0.08985710144042969, 0.09351730346679688, 0.09717750549316406, 0.10083770751953125, 0.10449790954589844, 0.10815811157226562, 0.11181831359863281, 0.115478515625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 2.0, 6.0, 5.0, 8.0, 8.0, 13.0, 14.0, 19.0, 18.0, 17.0, 29.0, 38.0, 51.0, 64.0, 102.0, 148.0, 114.0, 56.0, 62.0, 36.0, 40.0, 24.0, 13.0, 18.0, 18.0, 24.0, 6.0, 8.0, 7.0, 3.0, 3.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-05, -9.79006290435791e-06, -9.447336196899414e-06, -9.104609489440918e-06, -8.761882781982422e-06, -8.419156074523926e-06, -8.07642936706543e-06, -7.733702659606934e-06, -7.3909759521484375e-06, -7.048249244689941e-06, -6.705522537231445e-06, -6.362795829772949e-06, -6.020069122314453e-06, -5.677342414855957e-06, -5.334615707397461e-06, -4.991888999938965e-06, -4.649162292480469e-06, -4.306435585021973e-06, -3.9637088775634766e-06, -3.6209821701049805e-06, -3.2782554626464844e-06, -2.9355287551879883e-06, -2.592802047729492e-06, -2.250075340270996e-06, -1.9073486328125e-06, -1.564621925354004e-06, -1.2218952178955078e-06, -8.791685104370117e-07, -5.364418029785156e-07, -1.9371509552001953e-07, 1.4901161193847656e-07, 4.917383193969727e-07, 8.344650268554688e-07, 1.1771917343139648e-06, 1.519918441772461e-06, 1.862645149230957e-06, 2.205371856689453e-06, 2.5480985641479492e-06, 2.8908252716064453e-06, 3.2335519790649414e-06, 3.5762786865234375e-06, 3.919005393981934e-06, 4.26173210144043e-06, 4.604458808898926e-06, 4.947185516357422e-06, 5.289912223815918e-06, 5.632638931274414e-06, 5.97536563873291e-06, 6.318092346191406e-06, 6.660819053649902e-06, 7.0035457611083984e-06, 7.3462724685668945e-06, 7.68899917602539e-06, 8.031725883483887e-06, 8.374452590942383e-06, 8.717179298400879e-06, 9.059906005859375e-06, 9.402632713317871e-06, 9.745359420776367e-06, 1.0088086128234863e-05, 1.043081283569336e-05, 1.0773539543151855e-05, 1.1116266250610352e-05, 1.1458992958068848e-05, 1.1801719665527344e-05]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 4.0, 5.0, 11.0, 12.0, 13.0, 19.0, 33.0, 28.0, 55.0, 69.0, 150.0, 306.0, 1025.0, 5096.0, 27202.0, 207398.0, 717691.0, 73765.0, 12099.0, 2489.0, 570.0, 182.0, 102.0, 54.0, 37.0, 30.0, 21.0, 23.0, 10.0, 12.0, 8.0, 4.0, 8.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020444393157958984, -0.0001984778791666031, -0.00019251182675361633, -0.00018654577434062958, -0.00018057972192764282, -0.00017461366951465607, -0.0001686476171016693, -0.00016268156468868256, -0.0001567155122756958, -0.00015074945986270905, -0.0001447834074497223, -0.00013881735503673553, -0.00013285130262374878, -0.00012688525021076202, -0.00012091919779777527, -0.00011495314538478851, -0.00010898709297180176, -0.000103021040558815, -9.705498814582825e-05, -9.108893573284149e-05, -8.512288331985474e-05, -7.915683090686798e-05, -7.319077849388123e-05, -6.722472608089447e-05, -6.125867366790771e-05, -5.529262125492096e-05, -4.9326568841934204e-05, -4.336051642894745e-05, -3.739446401596069e-05, -3.142841160297394e-05, -2.5462359189987183e-05, -1.9496306777000427e-05, -1.3530254364013672e-05, -7.5642019510269165e-06, -1.5981495380401611e-06, 4.367902874946594e-06, 1.033395528793335e-05, 1.6300007700920105e-05, 2.226606011390686e-05, 2.8232112526893616e-05, 3.419816493988037e-05, 4.0164217352867126e-05, 4.613026976585388e-05, 5.209632217884064e-05, 5.806237459182739e-05, 6.402842700481415e-05, 6.99944794178009e-05, 7.596053183078766e-05, 8.192658424377441e-05, 8.789263665676117e-05, 9.385868906974792e-05, 9.982474148273468e-05, 0.00010579079389572144, 0.00011175684630870819, 0.00011772289872169495, 0.0001236889511346817, 0.00012965500354766846, 0.0001356210559606552, 0.00014158710837364197, 0.00014755316078662872, 0.00015351921319961548, 0.00015948526561260223, 0.000165451318025589, 0.00017141737043857574, 0.0001773834228515625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 9.0, 12.0, 24.0, 58.0, 97.0, 187.0, 227.0, 186.0, 109.0, 50.0, 22.0, 8.0, 8.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8223125152871944e-05, -1.7181559087475762e-05, -1.6139994841068983e-05, -1.50984287756728e-05, -1.405686361977132e-05, -1.301529846386984e-05, -1.1973732398473658e-05, -1.0932167242572177e-05, -9.890602086670697e-06, -8.849036930769216e-06, -7.807471774867736e-06, -6.7659057094715536e-06, -5.724340553570073e-06, -4.682775397668593e-06, -3.6412097870197613e-06, -2.59964417637093e-06, -1.5580790204694495e-06, -5.165136371942936e-07, 5.250517460808624e-07, 1.5666171293560183e-06, 2.608182512631174e-06, 3.6497476685326546e-06, 4.691313279181486e-06, 5.732878889830317e-06, 6.774444045731798e-06, 7.816009201633278e-06, 8.857574357534759e-06, 9.899140422930941e-06, 1.0940705578832421e-05, 1.1982270734733902e-05, 1.3023836800130084e-05, 1.4065401956031565e-05, 1.5106965292943642e-05, 1.6148531358339824e-05, 1.7190095604746602e-05, 1.8231661670142785e-05, 1.9273225916549563e-05, 2.0314791981945746e-05, 2.1356358047341928e-05, 2.2397922293748707e-05, 2.343948835914489e-05, 2.448105442454107e-05, 2.552261867094785e-05, 2.6564184736344032e-05, 2.7605750801740214e-05, 2.8647315048146993e-05, 2.9688881113543175e-05, 3.073044717893936e-05, 3.1772011425346136e-05, 3.2813575671752915e-05, 3.38551435561385e-05, 3.489670780254528e-05, 3.593827204895206e-05, 3.697983629535884e-05, 3.802140417974442e-05, 3.90629684261512e-05, 4.010453267255798e-05, 4.114609691896476e-05, 4.2187664803350344e-05, 4.322922904975712e-05, 4.42707932961639e-05, 4.531235754257068e-05, 4.6353925426956266e-05, 4.7395489673363045e-05, 4.843705755774863e-05]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 0.0, 2.0, 8.0, 7.0, 9.0, 6.0, 11.0, 20.0, 23.0, 14.0, 34.0, 23.0, 14.0, 33.0, 34.0, 18.0, 50.0, 53.0, 27.0, 49.0, 60.0, 33.0, 54.0, 51.0, 30.0, 39.0, 46.0, 19.0, 32.0, 26.0, 19.0, 24.0, 23.0, 12.0, 25.0, 16.0, 7.0, 17.0, 11.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-5.245208740234375e-06, -5.085952579975128e-06, -4.926696419715881e-06, -4.7674402594566345e-06, -4.608184099197388e-06, -4.448927938938141e-06, -4.289671778678894e-06, -4.130415618419647e-06, -3.9711594581604e-06, -3.8119032979011536e-06, -3.6526471376419067e-06, -3.49339097738266e-06, -3.334134817123413e-06, -3.1748786568641663e-06, -3.0156224966049194e-06, -2.8563663363456726e-06, -2.6971101760864258e-06, -2.537854015827179e-06, -2.378597855567932e-06, -2.2193416953086853e-06, -2.0600855350494385e-06, -1.9008293747901917e-06, -1.7415732145309448e-06, -1.582317054271698e-06, -1.4230608940124512e-06, -1.2638047337532043e-06, -1.1045485734939575e-06, -9.452924132347107e-07, -7.860362529754639e-07, -6.26780092716217e-07, -4.675239324569702e-07, -3.082677721977234e-07, -1.4901161193847656e-07, 1.0244548320770264e-08, 1.695007085800171e-07, 3.287568688392639e-07, 4.880130290985107e-07, 6.472691893577576e-07, 8.065253496170044e-07, 9.657815098762512e-07, 1.125037670135498e-06, 1.2842938303947449e-06, 1.4435499906539917e-06, 1.6028061509132385e-06, 1.7620623111724854e-06, 1.921318471431732e-06, 2.080574631690979e-06, 2.239830791950226e-06, 2.3990869522094727e-06, 2.5583431124687195e-06, 2.7175992727279663e-06, 2.876855432987213e-06, 3.03611159324646e-06, 3.1953677535057068e-06, 3.3546239137649536e-06, 3.5138800740242004e-06, 3.6731362342834473e-06, 3.832392394542694e-06, 3.991648554801941e-06, 4.150904715061188e-06, 4.3101608753204346e-06, 4.469417035579681e-06, 4.628673195838928e-06, 4.787929356098175e-06, 4.947185516357422e-06]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 4.0, 8.0, 16.0, 12.0, 14.0, 19.0, 26.0, 22.0, 17.0, 23.0, 26.0, 38.0, 35.0, 42.0, 49.0, 31.0, 50.0, 41.0, 51.0, 41.0, 42.0, 40.0, 31.0, 34.0, 28.0, 32.0, 25.0, 30.0, 27.0, 28.0, 17.0, 20.0, 12.0, 11.0, 14.0, 4.0, 6.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.583984375, -2.501953125, -2.419921875, -2.337890625, -2.255859375, -2.173828125, -2.091796875, -2.009765625, -1.927734375, -1.845703125, -1.763671875, -1.681640625, -1.599609375, -1.517578125, -1.435546875, -1.353515625, -1.271484375, -1.189453125, -1.107421875, -1.025390625, -0.943359375, -0.861328125, -0.779296875, -0.697265625, -0.615234375, -0.533203125, -0.451171875, -0.369140625, -0.287109375, -0.205078125, -0.123046875, -0.041015625, 0.041015625, 0.123046875, 0.205078125, 0.287109375, 0.369140625, 0.451171875, 0.533203125, 0.615234375, 0.697265625, 0.779296875, 0.861328125, 0.943359375, 1.025390625, 1.107421875, 1.189453125, 1.271484375, 1.353515625, 1.435546875, 1.517578125, 1.599609375, 1.681640625, 1.763671875, 1.845703125, 1.927734375, 2.009765625, 2.091796875, 2.173828125, 2.255859375, 2.337890625, 2.419921875, 2.501953125, 2.583984375, 2.666015625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 6.0, 13.0, 15.0, 14.0, 27.0, 37.0, 58.0, 100.0, 118.0, 205.0, 340.0, 502.0, 829.0, 1289.0, 1938.0, 3084.0, 4845.0, 7968.0, 13181.0, 23403.0, 46271.0, 124632.0, 474247.0, 210166.0, 63848.0, 29692.0, 16235.0, 9545.0, 5934.0, 3686.0, 2161.0, 1469.0, 944.0, 593.0, 425.0, 257.0, 151.0, 104.0, 75.0, 38.0, 37.0, 24.0, 14.0, 10.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.037109375, -2.938140869140625, -2.83917236328125, -2.740203857421875, -2.6412353515625, -2.542266845703125, -2.44329833984375, -2.344329833984375, -2.245361328125, -2.146392822265625, -2.04742431640625, -1.948455810546875, -1.8494873046875, -1.750518798828125, -1.65155029296875, -1.552581787109375, -1.45361328125, -1.354644775390625, -1.25567626953125, -1.156707763671875, -1.0577392578125, -0.958770751953125, -0.85980224609375, -0.760833740234375, -0.661865234375, -0.562896728515625, -0.46392822265625, -0.364959716796875, -0.2659912109375, -0.167022705078125, -0.06805419921875, 0.030914306640625, 0.1298828125, 0.228851318359375, 0.32781982421875, 0.426788330078125, 0.5257568359375, 0.624725341796875, 0.72369384765625, 0.822662353515625, 0.921630859375, 1.020599365234375, 1.11956787109375, 1.218536376953125, 1.3175048828125, 1.416473388671875, 1.51544189453125, 1.614410400390625, 1.71337890625, 1.812347412109375, 1.91131591796875, 2.010284423828125, 2.1092529296875, 2.208221435546875, 2.30718994140625, 2.406158447265625, 2.505126953125, 2.604095458984375, 2.70306396484375, 2.802032470703125, 2.9010009765625, 2.999969482421875, 3.09893798828125, 3.197906494140625, 3.296875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 3.0, 10.0, 12.0, 13.0, 16.0, 18.0, 14.0, 26.0, 23.0, 26.0, 30.0, 39.0, 36.0, 54.0, 53.0, 70.0, 112.0, 318.0, 1538.0, 145.0, 73.0, 58.0, 40.0, 44.0, 50.0, 35.0, 37.0, 28.0, 18.0, 8.0, 17.0, 15.0, 13.0, 9.0, 9.0, 9.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.0546875, -9.7598876953125, -9.465087890625, -9.1702880859375, -8.87548828125, -8.5806884765625, -8.285888671875, -7.9910888671875, -7.6962890625, -7.4014892578125, -7.106689453125, -6.8118896484375, -6.51708984375, -6.2222900390625, -5.927490234375, -5.6326904296875, -5.337890625, -5.0430908203125, -4.748291015625, -4.4534912109375, -4.15869140625, -3.8638916015625, -3.569091796875, -3.2742919921875, -2.9794921875, -2.6846923828125, -2.389892578125, -2.0950927734375, -1.80029296875, -1.5054931640625, -1.210693359375, -0.9158935546875, -0.62109375, -0.3262939453125, -0.031494140625, 0.2633056640625, 0.55810546875, 0.8529052734375, 1.147705078125, 1.4425048828125, 1.7373046875, 2.0321044921875, 2.326904296875, 2.6217041015625, 2.91650390625, 3.2113037109375, 3.506103515625, 3.8009033203125, 4.095703125, 4.3905029296875, 4.685302734375, 4.9801025390625, 5.27490234375, 5.5697021484375, 5.864501953125, 6.1593017578125, 6.4541015625, 6.7489013671875, 7.043701171875, 7.3385009765625, 7.63330078125, 7.9281005859375, 8.222900390625, 8.5177001953125, 8.8125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 4.0, 13.0, 4.0, 10.0, 12.0, 15.0, 21.0, 21.0, 29.0, 36.0, 68.0, 69.0, 120.0, 143.0, 208.0, 569.0, 2147.0, 13325.0, 313276.0, 2772400.0, 37033.0, 4298.0, 918.0, 340.0, 173.0, 111.0, 80.0, 59.0, 44.0, 28.0, 25.0, 23.0, 13.0, 18.0, 13.0, 15.0, 4.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.84375, -15.30126953125, -14.7587890625, -14.21630859375, -13.673828125, -13.13134765625, -12.5888671875, -12.04638671875, -11.50390625, -10.96142578125, -10.4189453125, -9.87646484375, -9.333984375, -8.79150390625, -8.2490234375, -7.70654296875, -7.1640625, -6.62158203125, -6.0791015625, -5.53662109375, -4.994140625, -4.45166015625, -3.9091796875, -3.36669921875, -2.82421875, -2.28173828125, -1.7392578125, -1.19677734375, -0.654296875, -0.11181640625, 0.4306640625, 0.97314453125, 1.515625, 2.05810546875, 2.6005859375, 3.14306640625, 3.685546875, 4.22802734375, 4.7705078125, 5.31298828125, 5.85546875, 6.39794921875, 6.9404296875, 7.48291015625, 8.025390625, 8.56787109375, 9.1103515625, 9.65283203125, 10.1953125, 10.73779296875, 11.2802734375, 11.82275390625, 12.365234375, 12.90771484375, 13.4501953125, 13.99267578125, 14.53515625, 15.07763671875, 15.6201171875, 16.16259765625, 16.705078125, 17.24755859375, 17.7900390625, 18.33251953125, 18.875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 43.0, 871.0, 101.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.74436378479004, -22.522239685058594, -16.30011749267578, -10.077993392944336, -3.8558692932128906, 2.3662548065185547, 8.588376998901367, 14.810503005981445, 21.032625198364258, 27.254749298095703, 33.476871490478516, 39.698997497558594, 45.921119689941406, 52.14324188232422, 58.36536407470703, 64.58749389648438, 70.80961608886719, 77.03173828125, 83.25386047363281, 89.47598266601562, 95.69811248779297, 101.92023468017578, 108.1423568725586, 114.36448669433594, 120.58660125732422, 126.80872344970703, 133.03085327148438, 139.2529754638672, 145.47509765625, 151.6972198486328, 157.91934204101562, 164.14146423339844, 170.3636016845703, 176.58572387695312, 182.80784606933594, 189.02996826171875, 195.25209045410156, 201.47421264648438, 207.69635009765625, 213.91847229003906, 220.14059448242188, 226.3627166748047, 232.5848388671875, 238.8069610595703, 245.02908325195312, 251.251220703125, 257.47332763671875, 263.6954650878906, 269.9175720214844, 276.13970947265625, 282.36181640625, 288.5839538574219, 294.8060607910156, 301.0281982421875, 307.25030517578125, 313.4724426269531, 319.694580078125, 325.9167175292969, 332.1388244628906, 338.3609619140625, 344.58306884765625, 350.8052062988281, 357.0273132324219, 363.24945068359375, 369.4715576171875]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 10.0, 10.0, 5.0, 10.0, 21.0, 15.0, 19.0, 25.0, 23.0, 18.0, 35.0, 33.0, 33.0, 39.0, 38.0, 38.0, 43.0, 51.0, 39.0, 43.0, 39.0, 30.0, 34.0, 30.0, 41.0, 44.0, 30.0, 21.0, 22.0, 26.0, 11.0, 16.0, 9.0, 17.0, 14.0, 12.0, 6.0, 12.0, 12.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.224456787109375, -23.472850799560547, -22.721242904663086, -21.969636917114258, -21.21803092956543, -20.46642303466797, -19.71481704711914, -18.963211059570312, -18.211605072021484, -17.459999084472656, -16.708391189575195, -15.956785202026367, -15.205179214477539, -14.453572273254395, -13.70196533203125, -12.950359344482422, -12.198751449584961, -11.447144508361816, -10.695538520812988, -9.943931579589844, -9.192325592041016, -8.440718650817871, -7.689111709594727, -6.93750524520874, -6.185898780822754, -5.434292316436768, -4.682685852050781, -3.9310789108276367, -3.1794724464416504, -2.427865982055664, -1.6762590408325195, -0.9246525764465332, -0.17304611206054688, 0.578560471534729, 1.3301670551300049, 2.0817737579345703, 2.8333802223205566, 3.584986686706543, 4.3365936279296875, 5.088200092315674, 5.83980655670166, 6.5914130210876465, 7.343019485473633, 8.094626426696777, 8.846233367919922, 9.59783935546875, 10.349446296691895, 11.101053237915039, 11.852659225463867, 12.604266166687012, 13.35587215423584, 14.107479095458984, 14.859085083007812, 15.610692024230957, 16.3622989654541, 17.11390495300293, 17.86551284790039, 18.61711883544922, 19.36872673034668, 20.120332717895508, 20.871938705444336, 21.623546600341797, 22.375152587890625, 23.126758575439453, 23.87836456298828]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 9.0, 9.0, 12.0, 8.0, 18.0, 15.0, 20.0, 22.0, 20.0, 19.0, 31.0, 30.0, 36.0, 41.0, 42.0, 45.0, 34.0, 52.0, 39.0, 49.0, 43.0, 44.0, 36.0, 35.0, 35.0, 19.0, 34.0, 37.0, 26.0, 23.0, 20.0, 18.0, 19.0, 14.0, 10.0, 7.0, 5.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.78125, -2.6942138671875, -2.607177734375, -2.5201416015625, -2.43310546875, -2.3460693359375, -2.259033203125, -2.1719970703125, -2.0849609375, -1.9979248046875, -1.910888671875, -1.8238525390625, -1.73681640625, -1.6497802734375, -1.562744140625, -1.4757080078125, -1.388671875, -1.3016357421875, -1.214599609375, -1.1275634765625, -1.04052734375, -0.9534912109375, -0.866455078125, -0.7794189453125, -0.6923828125, -0.6053466796875, -0.518310546875, -0.4312744140625, -0.34423828125, -0.2572021484375, -0.170166015625, -0.0831298828125, 0.00390625, 0.0909423828125, 0.177978515625, 0.2650146484375, 0.35205078125, 0.4390869140625, 0.526123046875, 0.6131591796875, 0.7001953125, 0.7872314453125, 0.874267578125, 0.9613037109375, 1.04833984375, 1.1353759765625, 1.222412109375, 1.3094482421875, 1.396484375, 1.4835205078125, 1.570556640625, 1.6575927734375, 1.74462890625, 1.8316650390625, 1.918701171875, 2.0057373046875, 2.0927734375, 2.1798095703125, 2.266845703125, 2.3538818359375, 2.44091796875, 2.5279541015625, 2.614990234375, 2.7020263671875, 2.7890625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 10.0, 6.0, 8.0, 9.0, 11.0, 22.0, 23.0, 22.0, 31.0, 53.0, 83.0, 164.0, 287.0, 593.0, 1501.0, 4618.0, 18167.0, 100153.0, 1038429.0, 2723222.0, 255990.0, 38114.0, 8410.0, 2506.0, 928.0, 375.0, 180.0, 90.0, 71.0, 56.0, 37.0, 41.0, 14.0, 11.0, 13.0, 10.0, 5.0, 7.0, 5.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9375, -8.641845703125, -8.34619140625, -8.050537109375, -7.7548828125, -7.459228515625, -7.16357421875, -6.867919921875, -6.572265625, -6.276611328125, -5.98095703125, -5.685302734375, -5.3896484375, -5.093994140625, -4.79833984375, -4.502685546875, -4.20703125, -3.911376953125, -3.61572265625, -3.320068359375, -3.0244140625, -2.728759765625, -2.43310546875, -2.137451171875, -1.841796875, -1.546142578125, -1.25048828125, -0.954833984375, -0.6591796875, -0.363525390625, -0.06787109375, 0.227783203125, 0.5234375, 0.819091796875, 1.11474609375, 1.410400390625, 1.7060546875, 2.001708984375, 2.29736328125, 2.593017578125, 2.888671875, 3.184326171875, 3.47998046875, 3.775634765625, 4.0712890625, 4.366943359375, 4.66259765625, 4.958251953125, 5.25390625, 5.549560546875, 5.84521484375, 6.140869140625, 6.4365234375, 6.732177734375, 7.02783203125, 7.323486328125, 7.619140625, 7.914794921875, 8.21044921875, 8.506103515625, 8.8017578125, 9.097412109375, 9.39306640625, 9.688720703125, 9.984375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 12.0, 14.0, 18.0, 22.0, 52.0, 77.0, 103.0, 173.0, 285.0, 426.0, 600.0, 707.0, 548.0, 352.0, 221.0, 146.0, 102.0, 56.0, 41.0, 33.0, 32.0, 18.0, 6.0, 8.0, 8.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.8984375, -9.6011962890625, -9.303955078125, -9.0067138671875, -8.70947265625, -8.4122314453125, -8.114990234375, -7.8177490234375, -7.5205078125, -7.2232666015625, -6.926025390625, -6.6287841796875, -6.33154296875, -6.0343017578125, -5.737060546875, -5.4398193359375, -5.142578125, -4.8453369140625, -4.548095703125, -4.2508544921875, -3.95361328125, -3.6563720703125, -3.359130859375, -3.0618896484375, -2.7646484375, -2.4674072265625, -2.170166015625, -1.8729248046875, -1.57568359375, -1.2784423828125, -0.981201171875, -0.6839599609375, -0.38671875, -0.0894775390625, 0.207763671875, 0.5050048828125, 0.80224609375, 1.0994873046875, 1.396728515625, 1.6939697265625, 1.9912109375, 2.2884521484375, 2.585693359375, 2.8829345703125, 3.18017578125, 3.4774169921875, 3.774658203125, 4.0718994140625, 4.369140625, 4.6663818359375, 4.963623046875, 5.2608642578125, 5.55810546875, 5.8553466796875, 6.152587890625, 6.4498291015625, 6.7470703125, 7.0443115234375, 7.341552734375, 7.6387939453125, 7.93603515625, 8.2332763671875, 8.530517578125, 8.8277587890625, 9.125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 7.0, 12.0, 9.0, 14.0, 30.0, 53.0, 83.0, 137.0, 296.0, 618.0, 1816.0, 10091.0, 137242.0, 3285598.0, 721212.0, 31559.0, 3744.0, 974.0, 385.0, 180.0, 89.0, 49.0, 35.0, 21.0, 9.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.28125, -21.556396484375, -20.83154296875, -20.106689453125, -19.3818359375, -18.656982421875, -17.93212890625, -17.207275390625, -16.482421875, -15.757568359375, -15.03271484375, -14.307861328125, -13.5830078125, -12.858154296875, -12.13330078125, -11.408447265625, -10.68359375, -9.958740234375, -9.23388671875, -8.509033203125, -7.7841796875, -7.059326171875, -6.33447265625, -5.609619140625, -4.884765625, -4.159912109375, -3.43505859375, -2.710205078125, -1.9853515625, -1.260498046875, -0.53564453125, 0.189208984375, 0.9140625, 1.638916015625, 2.36376953125, 3.088623046875, 3.8134765625, 4.538330078125, 5.26318359375, 5.988037109375, 6.712890625, 7.437744140625, 8.16259765625, 8.887451171875, 9.6123046875, 10.337158203125, 11.06201171875, 11.786865234375, 12.51171875, 13.236572265625, 13.96142578125, 14.686279296875, 15.4111328125, 16.135986328125, 16.86083984375, 17.585693359375, 18.310546875, 19.035400390625, 19.76025390625, 20.485107421875, 21.2099609375, 21.934814453125, 22.65966796875, 23.384521484375, 24.109375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 10.0, 18.0, 22.0, 39.0, 55.0, 87.0, 110.0, 118.0, 117.0, 103.0, 100.0, 64.0, 49.0, 36.0, 23.0, 21.0, 12.0, 9.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.61042785644531, -42.1127815246582, -40.615135192871094, -39.11749267578125, -37.61984634399414, -36.12220001220703, -34.62455749511719, -33.12691116333008, -31.62926483154297, -30.13161849975586, -28.633974075317383, -27.136329650878906, -25.638683319091797, -24.141036987304688, -22.64339256286621, -21.145748138427734, -19.648101806640625, -18.150455474853516, -16.65281105041504, -15.155165672302246, -13.657520294189453, -12.15987491607666, -10.662229537963867, -9.164584159851074, -7.666938781738281, -6.169293403625488, -4.671648025512695, -3.1740026473999023, -1.6763572692871094, -0.1787118911743164, 1.3189334869384766, 2.8165788650512695, 4.3142242431640625, 5.8118696212768555, 7.309514999389648, 8.807160377502441, 10.304805755615234, 11.802451133728027, 13.30009651184082, 14.797741889953613, 16.295387268066406, 17.793033599853516, 19.290678024291992, 20.78832244873047, 22.285968780517578, 23.783615112304688, 25.281259536743164, 26.77890396118164, 28.27655029296875, 29.77419662475586, 31.271841049194336, 32.76948547363281, 34.26713180541992, 35.76477813720703, 37.262420654296875, 38.760066986083984, 40.257713317871094, 41.7553596496582, 43.25300598144531, 44.750648498535156, 46.248294830322266, 47.745941162109375, 49.24358367919922, 50.74123001098633, 52.23887634277344]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 4.0, 6.0, 9.0, 14.0, 16.0, 18.0, 18.0, 22.0, 24.0, 33.0, 32.0, 44.0, 47.0, 54.0, 43.0, 30.0, 40.0, 43.0, 43.0, 42.0, 40.0, 47.0, 39.0, 47.0, 48.0, 28.0, 23.0, 25.0, 26.0, 16.0, 15.0, 17.0, 5.0, 15.0, 8.0, 7.0, 1.0, 4.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.645713806152344, -28.773040771484375, -27.900367736816406, -27.027694702148438, -26.155019760131836, -25.282346725463867, -24.4096736907959, -23.53700065612793, -22.664325714111328, -21.79165267944336, -20.91897964477539, -20.046306610107422, -19.17363166809082, -18.30095863342285, -17.428285598754883, -16.555612564086914, -15.682939529418945, -14.810266494750977, -13.937592506408691, -13.064919471740723, -12.192245483398438, -11.319572448730469, -10.4468994140625, -9.574226379394531, -8.701552391052246, -7.828878879547119, -6.956205368041992, -6.083532333374023, -5.2108588218688965, -4.3381853103637695, -3.465512275695801, -2.592838764190674, -1.7201652526855469, -0.8474918603897095, 0.02518153190612793, 0.8978548049926758, 1.7705283164978027, 2.6432018280029297, 3.5158748626708984, 4.388548374176025, 5.261221885681152, 6.133895397186279, 7.006568908691406, 7.879241943359375, 8.751914978027344, 9.624588966369629, 10.497262001037598, 11.369935989379883, 12.242609024047852, 13.11528205871582, 13.987956047058105, 14.860629081726074, 15.73330307006836, 16.605976104736328, 17.478649139404297, 18.351322174072266, 19.223995208740234, 20.096668243408203, 20.969341278076172, 21.84201431274414, 22.714689254760742, 23.58736228942871, 24.46003532409668, 25.33270835876465, 26.20538330078125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 6.0, 11.0, 9.0, 18.0, 19.0, 12.0, 20.0, 24.0, 19.0, 25.0, 33.0, 40.0, 34.0, 39.0, 39.0, 30.0, 47.0, 45.0, 55.0, 37.0, 40.0, 35.0, 36.0, 38.0, 27.0, 29.0, 30.0, 31.0, 31.0, 22.0, 15.0, 15.0, 12.0, 21.0, 9.0, 8.0, 5.0, 3.0, 3.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.626953125, -2.540802001953125, -2.45465087890625, -2.368499755859375, -2.2823486328125, -2.196197509765625, -2.11004638671875, -2.023895263671875, -1.937744140625, -1.851593017578125, -1.76544189453125, -1.679290771484375, -1.5931396484375, -1.506988525390625, -1.42083740234375, -1.334686279296875, -1.24853515625, -1.162384033203125, -1.07623291015625, -0.990081787109375, -0.9039306640625, -0.817779541015625, -0.73162841796875, -0.645477294921875, -0.559326171875, -0.473175048828125, -0.38702392578125, -0.300872802734375, -0.2147216796875, -0.128570556640625, -0.04241943359375, 0.043731689453125, 0.1298828125, 0.216033935546875, 0.30218505859375, 0.388336181640625, 0.4744873046875, 0.560638427734375, 0.64678955078125, 0.732940673828125, 0.819091796875, 0.905242919921875, 0.99139404296875, 1.077545166015625, 1.1636962890625, 1.249847412109375, 1.33599853515625, 1.422149658203125, 1.50830078125, 1.594451904296875, 1.68060302734375, 1.766754150390625, 1.8529052734375, 1.939056396484375, 2.02520751953125, 2.111358642578125, 2.197509765625, 2.283660888671875, 2.36981201171875, 2.455963134765625, 2.5421142578125, 2.628265380859375, 2.71441650390625, 2.800567626953125, 2.88671875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 6.0, 8.0, 10.0, 15.0, 16.0, 41.0, 43.0, 83.0, 107.0, 156.0, 240.0, 355.0, 505.0, 753.0, 1163.0, 1625.0, 2499.0, 3716.0, 5488.0, 8395.0, 12318.0, 18924.0, 29539.0, 47008.0, 78012.0, 152180.0, 344027.0, 140292.0, 74134.0, 44568.0, 27995.0, 18364.0, 11910.0, 7865.0, 5309.0, 3502.0, 2317.0, 1577.0, 1096.0, 733.0, 491.0, 356.0, 263.0, 171.0, 109.0, 98.0, 47.0, 49.0, 24.0, 25.0, 9.0, 11.0, 6.0, 7.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.206298828125, -0.19952392578125, -0.1927490234375, -0.18597412109375, -0.17919921875, -0.17242431640625, -0.1656494140625, -0.15887451171875, -0.152099609375, -0.14532470703125, -0.1385498046875, -0.13177490234375, -0.125, -0.11822509765625, -0.1114501953125, -0.10467529296875, -0.097900390625, -0.09112548828125, -0.0843505859375, -0.07757568359375, -0.07080078125, -0.06402587890625, -0.0572509765625, -0.05047607421875, -0.043701171875, -0.03692626953125, -0.0301513671875, -0.02337646484375, -0.0166015625, -0.00982666015625, -0.0030517578125, 0.00372314453125, 0.010498046875, 0.01727294921875, 0.0240478515625, 0.03082275390625, 0.03759765625, 0.04437255859375, 0.0511474609375, 0.05792236328125, 0.064697265625, 0.07147216796875, 0.0782470703125, 0.08502197265625, 0.091796875, 0.09857177734375, 0.1053466796875, 0.11212158203125, 0.118896484375, 0.12567138671875, 0.1324462890625, 0.13922119140625, 0.14599609375, 0.15277099609375, 0.1595458984375, 0.16632080078125, 0.173095703125, 0.17987060546875, 0.1866455078125, 0.19342041015625, 0.2001953125, 0.20697021484375, 0.2137451171875, 0.22052001953125, 0.227294921875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 5.0, 9.0, 7.0, 12.0, 17.0, 16.0, 22.0, 30.0, 22.0, 24.0, 23.0, 42.0, 36.0, 31.0, 25.0, 39.0, 41.0, 32.0, 37.0, 1067.0, 47.0, 40.0, 32.0, 38.0, 39.0, 32.0, 31.0, 40.0, 19.0, 26.0, 19.0, 21.0, 18.0, 13.0, 14.0, 6.0, 13.0, 10.0, 4.0, 7.0, 8.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 4.0], "bins": [-2.11328125, -2.051971435546875, -1.99066162109375, -1.929351806640625, -1.8680419921875, -1.806732177734375, -1.74542236328125, -1.684112548828125, -1.622802734375, -1.561492919921875, -1.50018310546875, -1.438873291015625, -1.3775634765625, -1.316253662109375, -1.25494384765625, -1.193634033203125, -1.13232421875, -1.071014404296875, -1.00970458984375, -0.948394775390625, -0.8870849609375, -0.825775146484375, -0.76446533203125, -0.703155517578125, -0.641845703125, -0.580535888671875, -0.51922607421875, -0.457916259765625, -0.3966064453125, -0.335296630859375, -0.27398681640625, -0.212677001953125, -0.1513671875, -0.090057373046875, -0.02874755859375, 0.032562255859375, 0.0938720703125, 0.155181884765625, 0.21649169921875, 0.277801513671875, 0.339111328125, 0.400421142578125, 0.46173095703125, 0.523040771484375, 0.5843505859375, 0.645660400390625, 0.70697021484375, 0.768280029296875, 0.82958984375, 0.890899658203125, 0.95220947265625, 1.013519287109375, 1.0748291015625, 1.136138916015625, 1.19744873046875, 1.258758544921875, 1.320068359375, 1.381378173828125, 1.44268798828125, 1.503997802734375, 1.5653076171875, 1.626617431640625, 1.68792724609375, 1.749237060546875, 1.810546875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 6.0, 5.0, 10.0, 17.0, 13.0, 17.0, 43.0, 51.0, 77.0, 117.0, 147.0, 204.0, 352.0, 431.0, 708.0, 990.0, 1523.0, 2295.0, 3481.0, 5422.0, 8597.0, 13708.0, 22694.0, 38873.0, 69873.0, 138176.0, 1419617.0, 174072.0, 81604.0, 44542.0, 26234.0, 15725.0, 9792.0, 6123.0, 3863.0, 2586.0, 1662.0, 1149.0, 686.0, 500.0, 336.0, 276.0, 152.0, 120.0, 84.0, 53.0, 41.0, 29.0, 16.0, 13.0, 14.0, 11.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12237548828125, -0.11824512481689453, -0.11411476135253906, -0.1099843978881836, -0.10585403442382812, -0.10172367095947266, -0.09759330749511719, -0.09346294403076172, -0.08933258056640625, -0.08520221710205078, -0.08107185363769531, -0.07694149017333984, -0.07281112670898438, -0.0686807632446289, -0.06455039978027344, -0.06042003631591797, -0.0562896728515625, -0.05215930938720703, -0.04802894592285156, -0.043898582458496094, -0.039768218994140625, -0.035637855529785156, -0.03150749206542969, -0.02737712860107422, -0.02324676513671875, -0.01911640167236328, -0.014986038208007812, -0.010855674743652344, -0.006725311279296875, -0.0025949478149414062, 0.0015354156494140625, 0.005665779113769531, 0.009796142578125, 0.013926506042480469, 0.018056869506835938, 0.022187232971191406, 0.026317596435546875, 0.030447959899902344, 0.03457832336425781, 0.03870868682861328, 0.04283905029296875, 0.04696941375732422, 0.05109977722167969, 0.055230140686035156, 0.059360504150390625, 0.0634908676147461, 0.06762123107910156, 0.07175159454345703, 0.0758819580078125, 0.08001232147216797, 0.08414268493652344, 0.0882730484008789, 0.09240341186523438, 0.09653377532958984, 0.10066413879394531, 0.10479450225830078, 0.10892486572265625, 0.11305522918701172, 0.11718559265136719, 0.12131595611572266, 0.12544631958007812, 0.1295766830444336, 0.13370704650878906, 0.13783740997314453, 0.1419677734375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 6.0, 5.0, 3.0, 7.0, 12.0, 12.0, 20.0, 23.0, 28.0, 28.0, 55.0, 63.0, 100.0, 113.0, 137.0, 83.0, 73.0, 64.0, 31.0, 47.0, 24.0, 13.0, 11.0, 11.0, 7.0, 1.0, 6.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2934207916259766e-05, -1.2519769370555878e-05, -1.210533082485199e-05, -1.1690892279148102e-05, -1.1276453733444214e-05, -1.0862015187740326e-05, -1.0447576642036438e-05, -1.003313809633255e-05, -9.618699550628662e-06, -9.204261004924774e-06, -8.789822459220886e-06, -8.375383913516998e-06, -7.96094536781311e-06, -7.546506822109222e-06, -7.1320682764053345e-06, -6.7176297307014465e-06, -6.303191184997559e-06, -5.888752639293671e-06, -5.474314093589783e-06, -5.059875547885895e-06, -4.645437002182007e-06, -4.230998456478119e-06, -3.816559910774231e-06, -3.402121365070343e-06, -2.987682819366455e-06, -2.573244273662567e-06, -2.158805727958679e-06, -1.7443671822547913e-06, -1.3299286365509033e-06, -9.154900908470154e-07, -5.010515451431274e-07, -8.66129994392395e-08, 3.2782554626464844e-07, 7.422640919685364e-07, 1.1567026376724243e-06, 1.5711411833763123e-06, 1.9855797290802e-06, 2.400018274784088e-06, 2.814456820487976e-06, 3.228895366191864e-06, 3.643333911895752e-06, 4.05777245759964e-06, 4.472211003303528e-06, 4.886649549007416e-06, 5.301088094711304e-06, 5.715526640415192e-06, 6.12996518611908e-06, 6.5444037318229675e-06, 6.9588422775268555e-06, 7.373280823230743e-06, 7.787719368934631e-06, 8.20215791463852e-06, 8.616596460342407e-06, 9.031035006046295e-06, 9.445473551750183e-06, 9.859912097454071e-06, 1.0274350643157959e-05, 1.0688789188861847e-05, 1.1103227734565735e-05, 1.1517666280269623e-05, 1.193210482597351e-05, 1.2346543371677399e-05, 1.2760981917381287e-05, 1.3175420463085175e-05, 1.3589859008789062e-05]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 4.0, 6.0, 9.0, 14.0, 16.0, 9.0, 31.0, 44.0, 67.0, 138.0, 255.0, 500.0, 1430.0, 4522.0, 19709.0, 124383.0, 756246.0, 115630.0, 18713.0, 4337.0, 1415.0, 511.0, 216.0, 116.0, 60.0, 44.0, 25.0, 22.0, 17.0, 16.0, 12.0, 4.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018322467803955078, -0.00017775222659111023, -0.00017227977514266968, -0.00016680732369422913, -0.00016133487224578857, -0.00015586242079734802, -0.00015038996934890747, -0.00014491751790046692, -0.00013944506645202637, -0.00013397261500358582, -0.00012850016355514526, -0.0001230277121067047, -0.00011755526065826416, -0.00011208280920982361, -0.00010661035776138306, -0.0001011379063129425, -9.566545486450195e-05, -9.01930034160614e-05, -8.472055196762085e-05, -7.92481005191803e-05, -7.377564907073975e-05, -6.83031976222992e-05, -6.283074617385864e-05, -5.735829472541809e-05, -5.188584327697754e-05, -4.641339182853699e-05, -4.0940940380096436e-05, -3.5468488931655884e-05, -2.9996037483215332e-05, -2.452358603477478e-05, -1.905113458633423e-05, -1.3578683137893677e-05, -8.106231689453125e-06, -2.6337802410125732e-06, 2.8386712074279785e-06, 8.31112265586853e-06, 1.3783574104309082e-05, 1.9256025552749634e-05, 2.4728477001190186e-05, 3.0200928449630737e-05, 3.567337989807129e-05, 4.114583134651184e-05, 4.661828279495239e-05, 5.2090734243392944e-05, 5.7563185691833496e-05, 6.303563714027405e-05, 6.85080885887146e-05, 7.398054003715515e-05, 7.94529914855957e-05, 8.492544293403625e-05, 9.03978943824768e-05, 9.587034583091736e-05, 0.00010134279727935791, 0.00010681524872779846, 0.00011228770017623901, 0.00011776015162467957, 0.00012323260307312012, 0.00012870505452156067, 0.00013417750597000122, 0.00013964995741844177, 0.00014512240886688232, 0.00015059486031532288, 0.00015606731176376343, 0.00016153976321220398, 0.00016701221466064453]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 12.0, 27.0, 51.0, 84.0, 189.0, 252.0, 195.0, 103.0, 49.0, 23.0, 10.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9928738008020446e-05, -4.88556943309959e-05, -4.7782654291950166e-05, -4.670961061492562e-05, -4.563656693790108e-05, -4.4563523260876536e-05, -4.349047958385199e-05, -4.241743954480626e-05, -4.1344395867781714e-05, -4.027135219075717e-05, -3.9198312151711434e-05, -3.812526847468689e-05, -3.705222479766235e-05, -3.5979181120637804e-05, -3.490613744361326e-05, -3.3833097404567525e-05, -3.276005372754298e-05, -3.168701005051844e-05, -3.06139700114727e-05, -2.954092633444816e-05, -2.8467882657423615e-05, -2.7394838980399072e-05, -2.6321797122363932e-05, -2.5248755264328793e-05, -2.417571158730425e-05, -2.3102667910279706e-05, -2.2029626052244566e-05, -2.0956584194209427e-05, -1.9883540517184883e-05, -1.881049684016034e-05, -1.77374549821252e-05, -1.666441312409006e-05, -1.559136580908671e-05, -1.4518323041556869e-05, -1.3445280274027027e-05, -1.2372237506497186e-05, -1.1299194738967344e-05, -1.0226151971437503e-05, -9.153109203907661e-06, -8.08006643637782e-06, -7.007023668847978e-06, -5.933980901318137e-06, -4.860938133788295e-06, -3.7878953662584536e-06, -2.714852598728612e-06, -1.6418098311987706e-06, -5.68767063668929e-07, 5.042757038609125e-07, 1.577318471390754e-06, 2.6503612389205955e-06, 3.723404006450437e-06, 4.7964467739802785e-06, 5.86948954151012e-06, 6.9425323090399615e-06, 8.015575076569803e-06, 9.088617844099645e-06, 1.0161660611629486e-05, 1.1234703379159328e-05, 1.2307746146689169e-05, 1.338078891421901e-05, 1.4453831681748852e-05, 1.5526875358773395e-05, 1.6599917216808535e-05, 1.7672959074843675e-05, 1.8746002751868218e-05]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 7.0, 1.0, 10.0, 9.0, 9.0, 21.0, 7.0, 33.0, 21.0, 32.0, 28.0, 16.0, 29.0, 21.0, 37.0, 44.0, 22.0, 44.0, 26.0, 44.0, 24.0, 44.0, 51.0, 28.0, 31.0, 30.0, 38.0, 25.0, 36.0, 43.0, 20.0, 27.0, 18.0, 26.0, 20.0, 13.0, 15.0, 7.0, 6.0, 7.0, 7.0, 8.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.708766937255859e-06, -4.555098712444305e-06, -4.4014304876327515e-06, -4.2477622628211975e-06, -4.0940940380096436e-06, -3.94042581319809e-06, -3.7867575883865356e-06, -3.6330893635749817e-06, -3.4794211387634277e-06, -3.3257529139518738e-06, -3.17208468914032e-06, -3.018416464328766e-06, -2.864748239517212e-06, -2.711080014705658e-06, -2.557411789894104e-06, -2.40374356508255e-06, -2.250075340270996e-06, -2.096407115459442e-06, -1.942738890647888e-06, -1.7890706658363342e-06, -1.6354024410247803e-06, -1.4817342162132263e-06, -1.3280659914016724e-06, -1.1743977665901184e-06, -1.0207295417785645e-06, -8.670613169670105e-07, -7.133930921554565e-07, -5.597248673439026e-07, -4.0605664253234863e-07, -2.523884177207947e-07, -9.872019290924072e-08, 5.494803190231323e-08, 2.086162567138672e-07, 3.6228448152542114e-07, 5.159527063369751e-07, 6.69620931148529e-07, 8.23289155960083e-07, 9.76957380771637e-07, 1.130625605583191e-06, 1.2842938303947449e-06, 1.4379620552062988e-06, 1.5916302800178528e-06, 1.7452985048294067e-06, 1.8989667296409607e-06, 2.0526349544525146e-06, 2.2063031792640686e-06, 2.3599714040756226e-06, 2.5136396288871765e-06, 2.6673078536987305e-06, 2.8209760785102844e-06, 2.9746443033218384e-06, 3.1283125281333923e-06, 3.2819807529449463e-06, 3.4356489777565002e-06, 3.589317202568054e-06, 3.742985427379608e-06, 3.896653652191162e-06, 4.050321877002716e-06, 4.20399010181427e-06, 4.357658326625824e-06, 4.511326551437378e-06, 4.664994776248932e-06, 4.818663001060486e-06, 4.97233122587204e-06, 5.125999450683594e-06]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 6.0, 11.0, 9.0, 18.0, 19.0, 12.0, 20.0, 24.0, 19.0, 25.0, 33.0, 40.0, 34.0, 39.0, 39.0, 30.0, 47.0, 45.0, 55.0, 37.0, 40.0, 35.0, 36.0, 38.0, 27.0, 29.0, 30.0, 31.0, 31.0, 22.0, 15.0, 15.0, 12.0, 21.0, 9.0, 8.0, 5.0, 3.0, 3.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.626953125, -2.540802001953125, -2.45465087890625, -2.368499755859375, -2.2823486328125, -2.196197509765625, -2.11004638671875, -2.023895263671875, -1.937744140625, -1.851593017578125, -1.76544189453125, -1.679290771484375, -1.5931396484375, -1.506988525390625, -1.42083740234375, -1.334686279296875, -1.24853515625, -1.162384033203125, -1.07623291015625, -0.990081787109375, -0.9039306640625, -0.817779541015625, -0.73162841796875, -0.645477294921875, -0.559326171875, -0.473175048828125, -0.38702392578125, -0.300872802734375, -0.2147216796875, -0.128570556640625, -0.04241943359375, 0.043731689453125, 0.1298828125, 0.216033935546875, 0.30218505859375, 0.388336181640625, 0.4744873046875, 0.560638427734375, 0.64678955078125, 0.732940673828125, 0.819091796875, 0.905242919921875, 0.99139404296875, 1.077545166015625, 1.1636962890625, 1.249847412109375, 1.33599853515625, 1.422149658203125, 1.50830078125, 1.594451904296875, 1.68060302734375, 1.766754150390625, 1.8529052734375, 1.939056396484375, 2.02520751953125, 2.111358642578125, 2.197509765625, 2.283660888671875, 2.36981201171875, 2.455963134765625, 2.5421142578125, 2.628265380859375, 2.71441650390625, 2.800567626953125, 2.88671875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 18.0, 21.0, 19.0, 35.0, 56.0, 92.0, 125.0, 204.0, 313.0, 436.0, 725.0, 1208.0, 1871.0, 2919.0, 4587.0, 7189.0, 11832.0, 19896.0, 37472.0, 85007.0, 270999.0, 388834.0, 109909.0, 45450.0, 23305.0, 13557.0, 8377.0, 5000.0, 3232.0, 2130.0, 1358.0, 866.0, 534.0, 340.0, 249.0, 144.0, 70.0, 75.0, 30.0, 33.0, 18.0, 6.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.841796875, -2.75335693359375, -2.6649169921875, -2.57647705078125, -2.488037109375, -2.39959716796875, -2.3111572265625, -2.22271728515625, -2.13427734375, -2.04583740234375, -1.9573974609375, -1.86895751953125, -1.780517578125, -1.69207763671875, -1.6036376953125, -1.51519775390625, -1.4267578125, -1.33831787109375, -1.2498779296875, -1.16143798828125, -1.072998046875, -0.98455810546875, -0.8961181640625, -0.80767822265625, -0.71923828125, -0.63079833984375, -0.5423583984375, -0.45391845703125, -0.365478515625, -0.27703857421875, -0.1885986328125, -0.10015869140625, -0.01171875, 0.07672119140625, 0.1651611328125, 0.25360107421875, 0.342041015625, 0.43048095703125, 0.5189208984375, 0.60736083984375, 0.69580078125, 0.78424072265625, 0.8726806640625, 0.96112060546875, 1.049560546875, 1.13800048828125, 1.2264404296875, 1.31488037109375, 1.4033203125, 1.49176025390625, 1.5802001953125, 1.66864013671875, 1.757080078125, 1.84552001953125, 1.9339599609375, 2.02239990234375, 2.11083984375, 2.19927978515625, 2.2877197265625, 2.37615966796875, 2.464599609375, 2.55303955078125, 2.6414794921875, 2.72991943359375, 2.818359375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 4.0, 7.0, 9.0, 13.0, 9.0, 11.0, 12.0, 13.0, 24.0, 32.0, 32.0, 31.0, 32.0, 31.0, 44.0, 65.0, 51.0, 86.0, 173.0, 1595.0, 232.0, 106.0, 70.0, 50.0, 52.0, 39.0, 37.0, 33.0, 18.0, 26.0, 19.0, 17.0, 18.0, 25.0, 12.0, 4.0, 4.0, 6.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.0, -11.65380859375, -11.3076171875, -10.96142578125, -10.615234375, -10.26904296875, -9.9228515625, -9.57666015625, -9.23046875, -8.88427734375, -8.5380859375, -8.19189453125, -7.845703125, -7.49951171875, -7.1533203125, -6.80712890625, -6.4609375, -6.11474609375, -5.7685546875, -5.42236328125, -5.076171875, -4.72998046875, -4.3837890625, -4.03759765625, -3.69140625, -3.34521484375, -2.9990234375, -2.65283203125, -2.306640625, -1.96044921875, -1.6142578125, -1.26806640625, -0.921875, -0.57568359375, -0.2294921875, 0.11669921875, 0.462890625, 0.80908203125, 1.1552734375, 1.50146484375, 1.84765625, 2.19384765625, 2.5400390625, 2.88623046875, 3.232421875, 3.57861328125, 3.9248046875, 4.27099609375, 4.6171875, 4.96337890625, 5.3095703125, 5.65576171875, 6.001953125, 6.34814453125, 6.6943359375, 7.04052734375, 7.38671875, 7.73291015625, 8.0791015625, 8.42529296875, 8.771484375, 9.11767578125, 9.4638671875, 9.81005859375, 10.15625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 9.0, 13.0, 17.0, 20.0, 22.0, 38.0, 30.0, 35.0, 44.0, 75.0, 113.0, 137.0, 233.0, 477.0, 1237.0, 5685.0, 41382.0, 2380887.0, 681204.0, 27621.0, 4182.0, 1028.0, 392.0, 220.0, 154.0, 88.0, 74.0, 65.0, 48.0, 37.0, 28.0, 25.0, 14.0, 16.0, 10.0, 10.0, 6.0, 3.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.78125, -17.240966796875, -16.70068359375, -16.160400390625, -15.6201171875, -15.079833984375, -14.53955078125, -13.999267578125, -13.458984375, -12.918701171875, -12.37841796875, -11.838134765625, -11.2978515625, -10.757568359375, -10.21728515625, -9.677001953125, -9.13671875, -8.596435546875, -8.05615234375, -7.515869140625, -6.9755859375, -6.435302734375, -5.89501953125, -5.354736328125, -4.814453125, -4.274169921875, -3.73388671875, -3.193603515625, -2.6533203125, -2.113037109375, -1.57275390625, -1.032470703125, -0.4921875, 0.048095703125, 0.58837890625, 1.128662109375, 1.6689453125, 2.209228515625, 2.74951171875, 3.289794921875, 3.830078125, 4.370361328125, 4.91064453125, 5.450927734375, 5.9912109375, 6.531494140625, 7.07177734375, 7.612060546875, 8.15234375, 8.692626953125, 9.23291015625, 9.773193359375, 10.3134765625, 10.853759765625, 11.39404296875, 11.934326171875, 12.474609375, 13.014892578125, 13.55517578125, 14.095458984375, 14.6357421875, 15.176025390625, 15.71630859375, 16.256591796875, 16.796875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 33.0, 58.0, 127.0, 194.0, 232.0, 183.0, 107.0, 43.0, 18.0, 6.0, 2.0, 3.0], "bins": [-77.05413055419922, -75.68666076660156, -74.3191909790039, -72.95172119140625, -71.5842514038086, -70.21678161621094, -68.84931182861328, -67.48184204101562, -66.11437225341797, -64.74690246582031, -63.379432678222656, -62.011962890625, -60.644493103027344, -59.27702331542969, -57.90955352783203, -56.542083740234375, -55.174617767333984, -53.80714797973633, -52.43967819213867, -51.072208404541016, -49.70473861694336, -48.3372688293457, -46.96980285644531, -45.602333068847656, -44.23486328125, -42.867393493652344, -41.49992370605469, -40.13245391845703, -38.764984130859375, -37.39751434326172, -36.03004455566406, -34.662574768066406, -33.29510498046875, -31.927635192871094, -30.560165405273438, -29.19269561767578, -27.825225830078125, -26.45775604248047, -25.090288162231445, -23.72281837463379, -22.355348587036133, -20.987878799438477, -19.62040901184082, -18.252941131591797, -16.88547134399414, -15.518000602722168, -14.150531768798828, -12.783061981201172, -11.415592193603516, -10.04812240600586, -8.680652618408203, -7.313183784484863, -5.945713996887207, -4.578244209289551, -3.210775375366211, -1.8433055877685547, -0.47583580017089844, 0.8916337490081787, 2.259103298187256, 3.626572608947754, 4.99404239654541, 6.361512184143066, 7.728981018066406, 9.096450805664062, 10.463920593261719]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 7.0, 9.0, 10.0, 12.0, 10.0, 18.0, 20.0, 24.0, 21.0, 27.0, 26.0, 36.0, 24.0, 31.0, 34.0, 31.0, 46.0, 42.0, 38.0, 57.0, 47.0, 30.0, 36.0, 45.0, 29.0, 29.0, 35.0, 21.0, 25.0, 25.0, 24.0, 12.0, 16.0, 10.0, 16.0, 10.0, 9.0, 10.0, 6.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.67646026611328, -27.801559448242188, -26.926660537719727, -26.051761627197266, -25.176860809326172, -24.301959991455078, -23.427061080932617, -22.552162170410156, -21.677261352539062, -20.80236053466797, -19.927461624145508, -19.052562713623047, -18.177661895751953, -17.30276107788086, -16.4278621673584, -15.552962303161621, -14.678062438964844, -13.803162574768066, -12.928262710571289, -12.053362846374512, -11.178462982177734, -10.303563117980957, -9.42866325378418, -8.553763389587402, -7.678863525390625, -6.803963661193848, -5.92906379699707, -5.054163932800293, -4.179264068603516, -3.3043642044067383, -2.429464340209961, -1.5545644760131836, -0.6796646118164062, 0.1952352523803711, 1.0701351165771484, 1.9450349807739258, 2.819934844970703, 3.6948347091674805, 4.569734573364258, 5.444634437561035, 6.3195343017578125, 7.19443416595459, 8.069334030151367, 8.944233894348145, 9.819133758544922, 10.6940336227417, 11.568933486938477, 12.443833351135254, 13.318733215332031, 14.193633079528809, 15.068532943725586, 15.943432807922363, 16.81833267211914, 17.693233489990234, 18.568132400512695, 19.443031311035156, 20.31793212890625, 21.192832946777344, 22.067731857299805, 22.942630767822266, 23.81753158569336, 24.692432403564453, 25.567331314086914, 26.442230224609375, 27.31713104248047]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 9.0, 3.0, 8.0, 20.0, 12.0, 18.0, 11.0, 22.0, 21.0, 26.0, 23.0, 28.0, 31.0, 34.0, 47.0, 39.0, 35.0, 39.0, 54.0, 44.0, 41.0, 34.0, 34.0, 37.0, 41.0, 28.0, 25.0, 24.0, 30.0, 30.0, 27.0, 19.0, 15.0, 17.0, 11.0, 16.0, 8.0, 7.0, 3.0, 7.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.591796875, -2.504302978515625, -2.41680908203125, -2.329315185546875, -2.2418212890625, -2.154327392578125, -2.06683349609375, -1.979339599609375, -1.891845703125, -1.804351806640625, -1.71685791015625, -1.629364013671875, -1.5418701171875, -1.454376220703125, -1.36688232421875, -1.279388427734375, -1.19189453125, -1.104400634765625, -1.01690673828125, -0.929412841796875, -0.8419189453125, -0.754425048828125, -0.66693115234375, -0.579437255859375, -0.491943359375, -0.404449462890625, -0.31695556640625, -0.229461669921875, -0.1419677734375, -0.054473876953125, 0.03302001953125, 0.120513916015625, 0.2080078125, 0.295501708984375, 0.38299560546875, 0.470489501953125, 0.5579833984375, 0.645477294921875, 0.73297119140625, 0.820465087890625, 0.907958984375, 0.995452880859375, 1.08294677734375, 1.170440673828125, 1.2579345703125, 1.345428466796875, 1.43292236328125, 1.520416259765625, 1.60791015625, 1.695404052734375, 1.78289794921875, 1.870391845703125, 1.9578857421875, 2.045379638671875, 2.13287353515625, 2.220367431640625, 2.307861328125, 2.395355224609375, 2.48284912109375, 2.570343017578125, 2.6578369140625, 2.745330810546875, 2.83282470703125, 2.920318603515625, 3.0078125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 10.0, 12.0, 17.0, 34.0, 34.0, 60.0, 73.0, 98.0, 188.0, 291.0, 495.0, 775.0, 1493.0, 2776.0, 5475.0, 11854.0, 27869.0, 74028.0, 230865.0, 939437.0, 1982269.0, 650093.0, 166880.0, 57015.0, 22458.0, 9659.0, 4684.0, 2335.0, 1197.0, 716.0, 400.0, 261.0, 154.0, 102.0, 52.0, 48.0, 20.0, 14.0, 20.0, 10.0, 9.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.05126953125, -3.8916015625, -3.73193359375, -3.572265625, -3.41259765625, -3.2529296875, -3.09326171875, -2.93359375, -2.77392578125, -2.6142578125, -2.45458984375, -2.294921875, -2.13525390625, -1.9755859375, -1.81591796875, -1.65625, -1.49658203125, -1.3369140625, -1.17724609375, -1.017578125, -0.85791015625, -0.6982421875, -0.53857421875, -0.37890625, -0.21923828125, -0.0595703125, 0.10009765625, 0.259765625, 0.41943359375, 0.5791015625, 0.73876953125, 0.8984375, 1.05810546875, 1.2177734375, 1.37744140625, 1.537109375, 1.69677734375, 1.8564453125, 2.01611328125, 2.17578125, 2.33544921875, 2.4951171875, 2.65478515625, 2.814453125, 2.97412109375, 3.1337890625, 3.29345703125, 3.453125, 3.61279296875, 3.7724609375, 3.93212890625, 4.091796875, 4.25146484375, 4.4111328125, 4.57080078125, 4.73046875, 4.89013671875, 5.0498046875, 5.20947265625, 5.369140625, 5.52880859375, 5.6884765625, 5.84814453125, 6.0078125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 10.0, 20.0, 15.0, 38.0, 63.0, 96.0, 158.0, 252.0, 435.0, 669.0, 781.0, 569.0, 370.0, 238.0, 135.0, 75.0, 60.0, 33.0, 25.0, 20.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5390625, -14.19573974609375, -13.8524169921875, -13.50909423828125, -13.165771484375, -12.82244873046875, -12.4791259765625, -12.13580322265625, -11.79248046875, -11.44915771484375, -11.1058349609375, -10.76251220703125, -10.419189453125, -10.07586669921875, -9.7325439453125, -9.38922119140625, -9.0458984375, -8.70257568359375, -8.3592529296875, -8.01593017578125, -7.672607421875, -7.32928466796875, -6.9859619140625, -6.64263916015625, -6.29931640625, -5.95599365234375, -5.6126708984375, -5.26934814453125, -4.926025390625, -4.58270263671875, -4.2393798828125, -3.89605712890625, -3.552734375, -3.20941162109375, -2.8660888671875, -2.52276611328125, -2.179443359375, -1.83612060546875, -1.4927978515625, -1.14947509765625, -0.80615234375, -0.46282958984375, -0.1195068359375, 0.22381591796875, 0.567138671875, 0.91046142578125, 1.2537841796875, 1.59710693359375, 1.9404296875, 2.28375244140625, 2.6270751953125, 2.97039794921875, 3.313720703125, 3.65704345703125, 4.0003662109375, 4.34368896484375, 4.68701171875, 5.03033447265625, 5.3736572265625, 5.71697998046875, 6.060302734375, 6.40362548828125, 6.7469482421875, 7.09027099609375, 7.43359375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 7.0, 7.0, 10.0, 27.0, 42.0, 57.0, 92.0, 131.0, 253.0, 496.0, 1168.0, 4423.0, 30561.0, 378082.0, 3263506.0, 471677.0, 36182.0, 5182.0, 1254.0, 476.0, 240.0, 138.0, 97.0, 60.0, 30.0, 22.0, 16.0, 14.0, 4.0, 5.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0546875, -12.4754638671875, -11.896240234375, -11.3170166015625, -10.73779296875, -10.1585693359375, -9.579345703125, -9.0001220703125, -8.4208984375, -7.8416748046875, -7.262451171875, -6.6832275390625, -6.10400390625, -5.5247802734375, -4.945556640625, -4.3663330078125, -3.787109375, -3.2078857421875, -2.628662109375, -2.0494384765625, -1.47021484375, -0.8909912109375, -0.311767578125, 0.2674560546875, 0.8466796875, 1.4259033203125, 2.005126953125, 2.5843505859375, 3.16357421875, 3.7427978515625, 4.322021484375, 4.9012451171875, 5.48046875, 6.0596923828125, 6.638916015625, 7.2181396484375, 7.79736328125, 8.3765869140625, 8.955810546875, 9.5350341796875, 10.1142578125, 10.6934814453125, 11.272705078125, 11.8519287109375, 12.43115234375, 13.0103759765625, 13.589599609375, 14.1688232421875, 14.748046875, 15.3272705078125, 15.906494140625, 16.4857177734375, 17.06494140625, 17.6441650390625, 18.223388671875, 18.8026123046875, 19.3818359375, 19.9610595703125, 20.540283203125, 21.1195068359375, 21.69873046875, 22.2779541015625, 22.857177734375, 23.4364013671875, 24.015625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 9.0, 11.0, 9.0, 24.0, 38.0, 48.0, 53.0, 61.0, 70.0, 64.0, 89.0, 92.0, 83.0, 72.0, 65.0, 42.0, 41.0, 38.0, 24.0, 30.0, 20.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.303756713867188, -22.264781951904297, -21.225807189941406, -20.186832427978516, -19.147857666015625, -18.108882904052734, -17.069910049438477, -16.030935287475586, -14.991960525512695, -13.952985763549805, -12.914011001586914, -11.87503719329834, -10.83606243133545, -9.797087669372559, -8.758113861083984, -7.719139099121094, -6.680164337158203, -5.6411895751953125, -4.60221529006958, -3.5632407665252686, -2.524266242980957, -1.4852914810180664, -0.446317195892334, 0.5926570892333984, 1.631631851196289, 2.6706063747406006, 3.709580898284912, 4.7485551834106445, 5.787529945373535, 6.826504707336426, 7.865478992462158, 8.90445327758789, 9.943424224853516, 10.982398986816406, 12.021373748779297, 13.060347557067871, 14.099322319030762, 15.138297080993652, 16.177270889282227, 17.216245651245117, 18.255220413208008, 19.2941951751709, 20.33316993713379, 21.37214469909668, 22.411117553710938, 23.450092315673828, 24.48906707763672, 25.52804183959961, 26.5670166015625, 27.60599136352539, 28.64496612548828, 29.683940887451172, 30.722915649414062, 31.761890411376953, 32.800865173339844, 33.83983612060547, 34.878814697265625, 35.917789459228516, 36.956764221191406, 37.9957389831543, 39.03471374511719, 40.07368850708008, 41.11266326904297, 42.151634216308594, 43.190608978271484]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 6.0, 8.0, 13.0, 13.0, 7.0, 18.0, 13.0, 22.0, 18.0, 21.0, 24.0, 36.0, 28.0, 37.0, 43.0, 42.0, 45.0, 43.0, 34.0, 51.0, 42.0, 45.0, 40.0, 41.0, 36.0, 40.0, 24.0, 17.0, 30.0, 25.0, 24.0, 16.0, 15.0, 15.0, 15.0, 9.0, 7.0, 6.0, 7.0, 8.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.361984252929688, -24.618484497070312, -23.874982833862305, -23.13148307800293, -22.387981414794922, -21.644481658935547, -20.900981903076172, -20.157480239868164, -19.413978576660156, -18.67047882080078, -17.926977157592773, -17.1834774017334, -16.43997573852539, -15.696475982666016, -14.952975273132324, -14.209474563598633, -13.465974807739258, -12.722474098205566, -11.978973388671875, -11.2354736328125, -10.491971969604492, -9.748472213745117, -9.004971504211426, -8.261470794677734, -7.517970085144043, -6.774469375610352, -6.03096866607666, -5.287468433380127, -4.5439677238464355, -3.800467014312744, -3.056966781616211, -2.3134660720825195, -1.5699653625488281, -0.8264647722244263, -0.08296418190002441, 0.6605362892150879, 1.4040369987487793, 2.1475377082824707, 2.891037940979004, 3.6345386505126953, 4.378039360046387, 5.121540069580078, 5.8650407791137695, 6.608541011810303, 7.352041721343994, 8.095542907714844, 8.839042663574219, 9.58254337310791, 10.326044082641602, 11.069544792175293, 11.813045501708984, 12.55654525756836, 13.300046920776367, 14.043546676635742, 14.787047386169434, 15.530548095703125, 16.2740478515625, 17.017547607421875, 17.761049270629883, 18.504549026489258, 19.248050689697266, 19.99155044555664, 20.735050201416016, 21.478551864624023, 22.22205352783203]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 8.0, 8.0, 6.0, 14.0, 18.0, 14.0, 23.0, 24.0, 32.0, 34.0, 26.0, 44.0, 44.0, 53.0, 48.0, 45.0, 55.0, 42.0, 52.0, 42.0, 39.0, 36.0, 42.0, 35.0, 35.0, 27.0, 29.0, 23.0, 22.0, 14.0, 17.0, 8.0, 13.0, 4.0, 8.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.703125, -2.60028076171875, -2.4974365234375, -2.39459228515625, -2.291748046875, -2.18890380859375, -2.0860595703125, -1.98321533203125, -1.88037109375, -1.77752685546875, -1.6746826171875, -1.57183837890625, -1.468994140625, -1.36614990234375, -1.2633056640625, -1.16046142578125, -1.0576171875, -0.95477294921875, -0.8519287109375, -0.74908447265625, -0.646240234375, -0.54339599609375, -0.4405517578125, -0.33770751953125, -0.23486328125, -0.13201904296875, -0.0291748046875, 0.07366943359375, 0.176513671875, 0.27935791015625, 0.3822021484375, 0.48504638671875, 0.587890625, 0.69073486328125, 0.7935791015625, 0.89642333984375, 0.999267578125, 1.10211181640625, 1.2049560546875, 1.30780029296875, 1.41064453125, 1.51348876953125, 1.6163330078125, 1.71917724609375, 1.822021484375, 1.92486572265625, 2.0277099609375, 2.13055419921875, 2.2333984375, 2.33624267578125, 2.4390869140625, 2.54193115234375, 2.644775390625, 2.74761962890625, 2.8504638671875, 2.95330810546875, 3.05615234375, 3.15899658203125, 3.2618408203125, 3.36468505859375, 3.467529296875, 3.57037353515625, 3.6732177734375, 3.77606201171875, 3.87890625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 3.0, 9.0, 8.0, 25.0, 14.0, 41.0, 50.0, 81.0, 135.0, 232.0, 325.0, 531.0, 910.0, 1571.0, 2683.0, 4884.0, 9022.0, 16597.0, 32393.0, 65980.0, 160106.0, 448129.0, 165997.0, 68124.0, 32960.0, 17168.0, 8993.0, 4953.0, 2757.0, 1556.0, 944.0, 533.0, 325.0, 191.0, 116.0, 86.0, 46.0, 33.0, 11.0, 15.0, 6.0, 4.0, 2.0, 3.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30859375, -0.2977714538574219, -0.28694915771484375, -0.2761268615722656, -0.2653045654296875, -0.2544822692871094, -0.24365997314453125, -0.23283767700195312, -0.222015380859375, -0.21119308471679688, -0.20037078857421875, -0.18954849243164062, -0.1787261962890625, -0.16790390014648438, -0.15708160400390625, -0.14625930786132812, -0.13543701171875, -0.12461471557617188, -0.11379241943359375, -0.10297012329101562, -0.0921478271484375, -0.08132553100585938, -0.07050323486328125, -0.059680938720703125, -0.048858642578125, -0.038036346435546875, -0.02721405029296875, -0.016391754150390625, -0.0055694580078125, 0.005252838134765625, 0.01607513427734375, 0.026897430419921875, 0.0377197265625, 0.048542022705078125, 0.05936431884765625, 0.07018661499023438, 0.0810089111328125, 0.09183120727539062, 0.10265350341796875, 0.11347579956054688, 0.124298095703125, 0.13512039184570312, 0.14594268798828125, 0.15676498413085938, 0.1675872802734375, 0.17840957641601562, 0.18923187255859375, 0.20005416870117188, 0.21087646484375, 0.22169876098632812, 0.23252105712890625, 0.24334335327148438, 0.2541656494140625, 0.2649879455566406, 0.27581024169921875, 0.2866325378417969, 0.297454833984375, 0.3082771301269531, 0.31909942626953125, 0.3299217224121094, 0.3407440185546875, 0.3515663146972656, 0.36238861083984375, 0.3732109069824219, 0.384033203125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 2.0, 8.0, 6.0, 8.0, 16.0, 8.0, 15.0, 7.0, 22.0, 15.0, 19.0, 20.0, 30.0, 29.0, 50.0, 24.0, 40.0, 37.0, 42.0, 27.0, 43.0, 1054.0, 37.0, 35.0, 47.0, 35.0, 36.0, 38.0, 30.0, 25.0, 26.0, 25.0, 16.0, 20.0, 15.0, 18.0, 16.0, 13.0, 12.0, 8.0, 13.0, 7.0, 8.0, 10.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9150390625, -1.8531036376953125, -1.791168212890625, -1.7292327880859375, -1.66729736328125, -1.6053619384765625, -1.543426513671875, -1.4814910888671875, -1.4195556640625, -1.3576202392578125, -1.295684814453125, -1.2337493896484375, -1.17181396484375, -1.1098785400390625, -1.047943115234375, -0.9860076904296875, -0.924072265625, -0.8621368408203125, -0.800201416015625, -0.7382659912109375, -0.67633056640625, -0.6143951416015625, -0.552459716796875, -0.4905242919921875, -0.4285888671875, -0.3666534423828125, -0.304718017578125, -0.2427825927734375, -0.18084716796875, -0.1189117431640625, -0.056976318359375, 0.0049591064453125, 0.06689453125, 0.1288299560546875, 0.190765380859375, 0.2527008056640625, 0.31463623046875, 0.3765716552734375, 0.438507080078125, 0.5004425048828125, 0.5623779296875, 0.6243133544921875, 0.686248779296875, 0.7481842041015625, 0.81011962890625, 0.8720550537109375, 0.933990478515625, 0.9959259033203125, 1.057861328125, 1.1197967529296875, 1.181732177734375, 1.2436676025390625, 1.30560302734375, 1.3675384521484375, 1.429473876953125, 1.4914093017578125, 1.5533447265625, 1.6152801513671875, 1.677215576171875, 1.7391510009765625, 1.80108642578125, 1.8630218505859375, 1.924957275390625, 1.9868927001953125, 2.048828125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 8.0, 5.0, 13.0, 11.0, 35.0, 43.0, 49.0, 76.0, 112.0, 154.0, 266.0, 381.0, 474.0, 779.0, 1094.0, 1593.0, 2486.0, 3478.0, 5173.0, 7969.0, 12033.0, 18816.0, 30768.0, 53248.0, 99402.0, 236491.0, 1355028.0, 113484.0, 59309.0, 34223.0, 20992.0, 13210.0, 8541.0, 5651.0, 3717.0, 2556.0, 1721.0, 1209.0, 814.0, 535.0, 353.0, 269.0, 175.0, 136.0, 83.0, 53.0, 40.0, 36.0, 13.0, 9.0, 6.0, 10.0, 4.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.1363525390625, -0.132232666015625, -0.12811279296875, -0.123992919921875, -0.119873046875, -0.115753173828125, -0.11163330078125, -0.107513427734375, -0.1033935546875, -0.099273681640625, -0.09515380859375, -0.091033935546875, -0.0869140625, -0.082794189453125, -0.07867431640625, -0.074554443359375, -0.0704345703125, -0.066314697265625, -0.06219482421875, -0.058074951171875, -0.053955078125, -0.049835205078125, -0.04571533203125, -0.041595458984375, -0.0374755859375, -0.033355712890625, -0.02923583984375, -0.025115966796875, -0.02099609375, -0.016876220703125, -0.01275634765625, -0.008636474609375, -0.0045166015625, -0.000396728515625, 0.00372314453125, 0.007843017578125, 0.011962890625, 0.016082763671875, 0.02020263671875, 0.024322509765625, 0.0284423828125, 0.032562255859375, 0.03668212890625, 0.040802001953125, 0.044921875, 0.049041748046875, 0.05316162109375, 0.057281494140625, 0.0614013671875, 0.065521240234375, 0.06964111328125, 0.073760986328125, 0.077880859375, 0.082000732421875, 0.08612060546875, 0.090240478515625, 0.0943603515625, 0.098480224609375, 0.10260009765625, 0.106719970703125, 0.11083984375, 0.114959716796875, 0.11907958984375, 0.123199462890625, 0.1273193359375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 1.0, 8.0, 2.0, 10.0, 8.0, 8.0, 8.0, 13.0, 13.0, 20.0, 29.0, 32.0, 31.0, 60.0, 73.0, 98.0, 124.0, 109.0, 66.0, 62.0, 62.0, 28.0, 26.0, 26.0, 19.0, 15.0, 6.0, 6.0, 8.0, 6.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9431114196777344e-05, -1.877918839454651e-05, -1.8127262592315674e-05, -1.747533679008484e-05, -1.6823410987854004e-05, -1.617148518562317e-05, -1.5519559383392334e-05, -1.4867633581161499e-05, -1.4215707778930664e-05, -1.3563781976699829e-05, -1.2911856174468994e-05, -1.225993037223816e-05, -1.1608004570007324e-05, -1.095607876777649e-05, -1.0304152965545654e-05, -9.65222716331482e-06, -9.000301361083984e-06, -8.34837555885315e-06, -7.696449756622314e-06, -7.0445239543914795e-06, -6.3925981521606445e-06, -5.7406723499298096e-06, -5.088746547698975e-06, -4.43682074546814e-06, -3.7848949432373047e-06, -3.1329691410064697e-06, -2.4810433387756348e-06, -1.8291175365447998e-06, -1.1771917343139648e-06, -5.252659320831299e-07, 1.2665987014770508e-07, 7.7858567237854e-07, 1.430511474609375e-06, 2.08243727684021e-06, 2.734363079071045e-06, 3.38628888130188e-06, 4.038214683532715e-06, 4.69014048576355e-06, 5.342066287994385e-06, 5.99399209022522e-06, 6.645917892456055e-06, 7.29784369468689e-06, 7.949769496917725e-06, 8.60169529914856e-06, 9.253621101379395e-06, 9.90554690361023e-06, 1.0557472705841064e-05, 1.12093985080719e-05, 1.1861324310302734e-05, 1.251325011253357e-05, 1.3165175914764404e-05, 1.381710171699524e-05, 1.4469027519226074e-05, 1.512095332145691e-05, 1.5772879123687744e-05, 1.642480492591858e-05, 1.7076730728149414e-05, 1.772865653038025e-05, 1.8380582332611084e-05, 1.903250813484192e-05, 1.9684433937072754e-05, 2.033635973930359e-05, 2.0988285541534424e-05, 2.164021134376526e-05, 2.2292137145996094e-05]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 4.0, 5.0, 6.0, 8.0, 5.0, 3.0, 11.0, 27.0, 28.0, 56.0, 88.0, 159.0, 539.0, 5151.0, 164002.0, 859364.0, 17318.0, 1217.0, 236.0, 118.0, 71.0, 30.0, 23.0, 13.0, 10.0, 11.0, 7.0, 7.0, 6.0, 5.0, 9.0, 0.0, 5.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004360675811767578, -0.00042368099093437195, -0.0004112944006919861, -0.0003989078104496002, -0.00038652122020721436, -0.0003741346299648285, -0.0003617480397224426, -0.00034936144948005676, -0.0003369748592376709, -0.00032458826899528503, -0.00031220167875289917, -0.0002998150885105133, -0.00028742849826812744, -0.0002750419080257416, -0.0002626553177833557, -0.00025026872754096985, -0.00023788213729858398, -0.00022549554705619812, -0.00021310895681381226, -0.0002007223665714264, -0.00018833577632904053, -0.00017594918608665466, -0.0001635625958442688, -0.00015117600560188293, -0.00013878941535949707, -0.0001264028251171112, -0.00011401623487472534, -0.00010162964463233948, -8.924305438995361e-05, -7.685646414756775e-05, -6.446987390518188e-05, -5.208328366279602e-05, -3.9696693420410156e-05, -2.7310103178024292e-05, -1.4923512935638428e-05, -2.5369226932525635e-06, 9.8496675491333e-06, 2.2236257791519165e-05, 3.462284803390503e-05, 4.7009438276290894e-05, 5.939602851867676e-05, 7.178261876106262e-05, 8.416920900344849e-05, 9.655579924583435e-05, 0.00010894238948822021, 0.00012132897973060608, 0.00013371556997299194, 0.0001461021602153778, 0.00015848875045776367, 0.00017087534070014954, 0.0001832619309425354, 0.00019564852118492126, 0.00020803511142730713, 0.000220421701669693, 0.00023280829191207886, 0.0002451948821544647, 0.0002575814723968506, 0.00026996806263923645, 0.0002823546528816223, 0.0002947412431240082, 0.00030712783336639404, 0.0003195144236087799, 0.00033190101385116577, 0.00034428760409355164, 0.0003566741943359375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 12.0, 28.0, 81.0, 160.0, 244.0, 222.0, 134.0, 63.0, 31.0, 17.0, 11.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6518024494871497e-05, -1.532950409455225e-05, -1.4140984603727702e-05, -1.2952464203408454e-05, -1.1763944712583907e-05, -1.0575424312264659e-05, -9.38690391194541e-06, -8.198384421120863e-06, -7.009864020801615e-06, -5.821344075229717e-06, -4.63282412965782e-06, -3.4443037293385714e-06, -2.255783783766674e-06, -1.0672638381947763e-06, 1.212565621244721e-07, 1.3097760529490188e-06, 2.4982964532682672e-06, 3.6868163988401648e-06, 4.875336344412062e-06, 6.063856744731311e-06, 7.252376690303208e-06, 8.440896635875106e-06, 9.629417036194354e-06, 1.0817936527018901e-05, 1.200645692733815e-05, 1.3194977327657398e-05, 1.4383496818481945e-05, 1.5572017218801193e-05, 1.676053761912044e-05, 1.7949056200450286e-05, 1.9137576600769535e-05, 2.0326097001088783e-05, 2.151461740140803e-05, 2.270313780172728e-05, 2.389165820204653e-05, 2.5080178602365777e-05, 2.6268697183695622e-05, 2.745721758401487e-05, 2.864573798433412e-05, 2.9834256565663964e-05, 3.102277696598321e-05, 3.221129736630246e-05, 3.339981776662171e-05, 3.458833816694096e-05, 3.5776858567260206e-05, 3.6965378967579454e-05, 3.81538993678987e-05, 3.9342416130239144e-05, 4.05309401685372e-05, 4.171946056885645e-05, 4.2907980969175696e-05, 4.4096501369494945e-05, 4.528502176981419e-05, 4.647354217013344e-05, 4.766206257045269e-05, 4.885057933279313e-05, 5.003909973311238e-05, 5.122762013343163e-05, 5.241614053375088e-05, 5.3604660934070125e-05, 5.4793181334389374e-05, 5.5981698096729815e-05, 5.7170218497049063e-05, 5.835873889736831e-05, 5.954725929768756e-05]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 8.0, 3.0, 5.0, 8.0, 10.0, 10.0, 9.0, 15.0, 22.0, 18.0, 21.0, 21.0, 23.0, 31.0, 36.0, 41.0, 27.0, 58.0, 34.0, 44.0, 47.0, 28.0, 56.0, 29.0, 50.0, 30.0, 42.0, 27.0, 40.0, 22.0, 25.0, 25.0, 24.0, 19.0, 12.0, 18.0, 6.0, 10.0, 8.0, 7.0, 5.0, 7.0, 8.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.821487426757812e-06, -8.550472557544708e-06, -8.279457688331604e-06, -8.0084428191185e-06, -7.737427949905396e-06, -7.466413080692291e-06, -7.195398211479187e-06, -6.924383342266083e-06, -6.6533684730529785e-06, -6.382353603839874e-06, -6.11133873462677e-06, -5.840323865413666e-06, -5.5693089962005615e-06, -5.298294126987457e-06, -5.027279257774353e-06, -4.756264388561249e-06, -4.4852495193481445e-06, -4.21423465013504e-06, -3.943219780921936e-06, -3.6722049117088318e-06, -3.4011900424957275e-06, -3.1301751732826233e-06, -2.859160304069519e-06, -2.588145434856415e-06, -2.3171305656433105e-06, -2.0461156964302063e-06, -1.775100827217102e-06, -1.5040859580039978e-06, -1.2330710887908936e-06, -9.620562195777893e-07, -6.910413503646851e-07, -4.200264811515808e-07, -1.4901161193847656e-07, 1.2200325727462769e-07, 3.9301812648773193e-07, 6.640329957008362e-07, 9.350478649139404e-07, 1.2060627341270447e-06, 1.477077603340149e-06, 1.7480924725532532e-06, 2.0191073417663574e-06, 2.2901222109794617e-06, 2.561137080192566e-06, 2.83215194940567e-06, 3.1031668186187744e-06, 3.3741816878318787e-06, 3.645196557044983e-06, 3.916211426258087e-06, 4.187226295471191e-06, 4.458241164684296e-06, 4.7292560338974e-06, 5.000270903110504e-06, 5.271285772323608e-06, 5.542300641536713e-06, 5.813315510749817e-06, 6.084330379962921e-06, 6.355345249176025e-06, 6.62636011838913e-06, 6.897374987602234e-06, 7.168389856815338e-06, 7.439404726028442e-06, 7.710419595241547e-06, 7.981434464454651e-06, 8.252449333667755e-06, 8.52346420288086e-06]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 8.0, 8.0, 6.0, 14.0, 18.0, 14.0, 23.0, 24.0, 32.0, 34.0, 26.0, 44.0, 44.0, 53.0, 48.0, 45.0, 55.0, 42.0, 52.0, 42.0, 39.0, 36.0, 42.0, 35.0, 35.0, 27.0, 29.0, 23.0, 22.0, 14.0, 17.0, 8.0, 13.0, 4.0, 8.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.703125, -2.60028076171875, -2.4974365234375, -2.39459228515625, -2.291748046875, -2.18890380859375, -2.0860595703125, -1.98321533203125, -1.88037109375, -1.77752685546875, -1.6746826171875, -1.57183837890625, -1.468994140625, -1.36614990234375, -1.2633056640625, -1.16046142578125, -1.0576171875, -0.95477294921875, -0.8519287109375, -0.74908447265625, -0.646240234375, -0.54339599609375, -0.4405517578125, -0.33770751953125, -0.23486328125, -0.13201904296875, -0.0291748046875, 0.07366943359375, 0.176513671875, 0.27935791015625, 0.3822021484375, 0.48504638671875, 0.587890625, 0.69073486328125, 0.7935791015625, 0.89642333984375, 0.999267578125, 1.10211181640625, 1.2049560546875, 1.30780029296875, 1.41064453125, 1.51348876953125, 1.6163330078125, 1.71917724609375, 1.822021484375, 1.92486572265625, 2.0277099609375, 2.13055419921875, 2.2333984375, 2.33624267578125, 2.4390869140625, 2.54193115234375, 2.644775390625, 2.74761962890625, 2.8504638671875, 2.95330810546875, 3.05615234375, 3.15899658203125, 3.2618408203125, 3.36468505859375, 3.467529296875, 3.57037353515625, 3.6732177734375, 3.77606201171875, 3.87890625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 16.0, 15.0, 36.0, 56.0, 82.0, 130.0, 219.0, 371.0, 594.0, 918.0, 1562.0, 2608.0, 4506.0, 8267.0, 16313.0, 34312.0, 82070.0, 250491.0, 402573.0, 141131.0, 52308.0, 23490.0, 11816.0, 6082.0, 3398.0, 1984.0, 1229.0, 768.0, 455.0, 279.0, 180.0, 111.0, 65.0, 56.0, 28.0, 13.0, 11.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3515625, -4.21234130859375, -4.0731201171875, -3.93389892578125, -3.794677734375, -3.65545654296875, -3.5162353515625, -3.37701416015625, -3.23779296875, -3.09857177734375, -2.9593505859375, -2.82012939453125, -2.680908203125, -2.54168701171875, -2.4024658203125, -2.26324462890625, -2.1240234375, -1.98480224609375, -1.8455810546875, -1.70635986328125, -1.567138671875, -1.42791748046875, -1.2886962890625, -1.14947509765625, -1.01025390625, -0.87103271484375, -0.7318115234375, -0.59259033203125, -0.453369140625, -0.31414794921875, -0.1749267578125, -0.03570556640625, 0.103515625, 0.24273681640625, 0.3819580078125, 0.52117919921875, 0.660400390625, 0.79962158203125, 0.9388427734375, 1.07806396484375, 1.21728515625, 1.35650634765625, 1.4957275390625, 1.63494873046875, 1.774169921875, 1.91339111328125, 2.0526123046875, 2.19183349609375, 2.3310546875, 2.47027587890625, 2.6094970703125, 2.74871826171875, 2.887939453125, 3.02716064453125, 3.1663818359375, 3.30560302734375, 3.44482421875, 3.58404541015625, 3.7232666015625, 3.86248779296875, 4.001708984375, 4.14093017578125, 4.2801513671875, 4.41937255859375, 4.55859375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 3.0, 8.0, 8.0, 17.0, 14.0, 16.0, 21.0, 17.0, 17.0, 24.0, 38.0, 42.0, 38.0, 58.0, 74.0, 115.0, 255.0, 1512.0, 200.0, 112.0, 80.0, 61.0, 52.0, 35.0, 35.0, 30.0, 36.0, 30.0, 17.0, 12.0, 12.0, 15.0, 10.0, 7.0, 7.0, 3.0, 0.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.671875, -12.29345703125, -11.9150390625, -11.53662109375, -11.158203125, -10.77978515625, -10.4013671875, -10.02294921875, -9.64453125, -9.26611328125, -8.8876953125, -8.50927734375, -8.130859375, -7.75244140625, -7.3740234375, -6.99560546875, -6.6171875, -6.23876953125, -5.8603515625, -5.48193359375, -5.103515625, -4.72509765625, -4.3466796875, -3.96826171875, -3.58984375, -3.21142578125, -2.8330078125, -2.45458984375, -2.076171875, -1.69775390625, -1.3193359375, -0.94091796875, -0.5625, -0.18408203125, 0.1943359375, 0.57275390625, 0.951171875, 1.32958984375, 1.7080078125, 2.08642578125, 2.46484375, 2.84326171875, 3.2216796875, 3.60009765625, 3.978515625, 4.35693359375, 4.7353515625, 5.11376953125, 5.4921875, 5.87060546875, 6.2490234375, 6.62744140625, 7.005859375, 7.38427734375, 7.7626953125, 8.14111328125, 8.51953125, 8.89794921875, 9.2763671875, 9.65478515625, 10.033203125, 10.41162109375, 10.7900390625, 11.16845703125, 11.546875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 4.0, 12.0, 7.0, 15.0, 20.0, 16.0, 26.0, 35.0, 51.0, 85.0, 91.0, 93.0, 176.0, 263.0, 466.0, 1830.0, 13077.0, 260744.0, 2779260.0, 81460.0, 5979.0, 957.0, 320.0, 179.0, 123.0, 99.0, 81.0, 71.0, 29.0, 25.0, 36.0, 18.0, 13.0, 12.0, 12.0, 2.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.796875, -19.121826171875, -18.44677734375, -17.771728515625, -17.0966796875, -16.421630859375, -15.74658203125, -15.071533203125, -14.396484375, -13.721435546875, -13.04638671875, -12.371337890625, -11.6962890625, -11.021240234375, -10.34619140625, -9.671142578125, -8.99609375, -8.321044921875, -7.64599609375, -6.970947265625, -6.2958984375, -5.620849609375, -4.94580078125, -4.270751953125, -3.595703125, -2.920654296875, -2.24560546875, -1.570556640625, -0.8955078125, -0.220458984375, 0.45458984375, 1.129638671875, 1.8046875, 2.479736328125, 3.15478515625, 3.829833984375, 4.5048828125, 5.179931640625, 5.85498046875, 6.530029296875, 7.205078125, 7.880126953125, 8.55517578125, 9.230224609375, 9.9052734375, 10.580322265625, 11.25537109375, 11.930419921875, 12.60546875, 13.280517578125, 13.95556640625, 14.630615234375, 15.3056640625, 15.980712890625, 16.65576171875, 17.330810546875, 18.005859375, 18.680908203125, 19.35595703125, 20.031005859375, 20.7060546875, 21.381103515625, 22.05615234375, 22.731201171875, 23.40625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [19.0, 303.0, 578.0, 117.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0822172164917, -6.789442539215088, -1.4966678619384766, 3.796107292175293, 9.088881492614746, 14.3816556930542, 19.67443084716797, 24.967205047607422, 30.259979248046875, 35.55275344848633, 40.84552764892578, 46.1383056640625, 51.43107604980469, 56.723854064941406, 62.01662826538086, 67.30940246582031, 72.60218048095703, 77.89495849609375, 83.18772888183594, 88.48050689697266, 93.77327728271484, 99.06605529785156, 104.35882568359375, 109.65160369873047, 114.94437408447266, 120.23715209960938, 125.52992248535156, 130.82269287109375, 136.115478515625, 141.4082489013672, 146.70101928710938, 151.99380493164062, 157.2865753173828, 162.579345703125, 167.87213134765625, 173.16490173339844, 178.45767211914062, 183.7504425048828, 189.04322814941406, 194.33599853515625, 199.62876892089844, 204.92153930664062, 210.21432495117188, 215.50709533691406, 220.79986572265625, 226.09263610839844, 231.3854217529297, 236.67819213867188, 241.97097778320312, 247.2637481689453, 252.55653381347656, 257.84930419921875, 263.14208984375, 268.4348449707031, 273.7276306152344, 279.0203857421875, 284.31317138671875, 289.60595703125, 294.8987121582031, 300.1914978027344, 305.4842834472656, 310.77703857421875, 316.06982421875, 321.36260986328125, 326.6553649902344]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 9.0, 7.0, 2.0, 11.0, 21.0, 20.0, 20.0, 28.0, 25.0, 22.0, 31.0, 35.0, 38.0, 43.0, 42.0, 39.0, 62.0, 48.0, 48.0, 52.0, 50.0, 42.0, 38.0, 43.0, 22.0, 30.0, 28.0, 16.0, 30.0, 22.0, 12.0, 15.0, 16.0, 6.0, 6.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-33.731544494628906, -32.7323112487793, -31.733076095581055, -30.733840942382812, -29.734607696533203, -28.73537254333496, -27.73613739013672, -26.73690414428711, -25.7376708984375, -24.738435745239258, -23.73920249938965, -22.739967346191406, -21.740734100341797, -20.741498947143555, -19.742263793945312, -18.743030548095703, -17.74379539489746, -16.74456024169922, -15.74532699584961, -14.746091842651367, -13.746858596801758, -12.747623443603516, -11.74838924407959, -10.749155044555664, -9.749920845031738, -8.750686645507812, -7.751452445983887, -6.752217769622803, -5.752983570098877, -4.753749370574951, -3.754514694213867, -2.7552804946899414, -1.7560462951660156, -0.7568119764328003, 0.24242234230041504, 1.24165678024292, 2.2408909797668457, 3.2401251792907715, 4.2393598556518555, 5.238594055175781, 6.237828254699707, 7.237062454223633, 8.236296653747559, 9.235530853271484, 10.234766006469727, 11.233999252319336, 12.233234405517578, 13.232468605041504, 14.23170280456543, 15.230937004089355, 16.23017120361328, 17.229406356811523, 18.228639602661133, 19.227874755859375, 20.227108001708984, 21.226343154907227, 22.22557830810547, 23.22481346130371, 24.22404670715332, 25.223281860351562, 26.222515106201172, 27.221750259399414, 28.220985412597656, 29.220218658447266, 30.219451904296875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 6.0, 5.0, 13.0, 6.0, 17.0, 19.0, 21.0, 26.0, 22.0, 41.0, 31.0, 37.0, 47.0, 59.0, 44.0, 48.0, 49.0, 48.0, 46.0, 38.0, 52.0, 44.0, 38.0, 29.0, 29.0, 30.0, 23.0, 21.0, 18.0, 24.0, 18.0, 10.0, 8.0, 11.0, 2.0, 3.0, 0.0, 2.0, 6.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.84375, -2.735595703125, -2.62744140625, -2.519287109375, -2.4111328125, -2.302978515625, -2.19482421875, -2.086669921875, -1.978515625, -1.870361328125, -1.76220703125, -1.654052734375, -1.5458984375, -1.437744140625, -1.32958984375, -1.221435546875, -1.11328125, -1.005126953125, -0.89697265625, -0.788818359375, -0.6806640625, -0.572509765625, -0.46435546875, -0.356201171875, -0.248046875, -0.139892578125, -0.03173828125, 0.076416015625, 0.1845703125, 0.292724609375, 0.40087890625, 0.509033203125, 0.6171875, 0.725341796875, 0.83349609375, 0.941650390625, 1.0498046875, 1.157958984375, 1.26611328125, 1.374267578125, 1.482421875, 1.590576171875, 1.69873046875, 1.806884765625, 1.9150390625, 2.023193359375, 2.13134765625, 2.239501953125, 2.34765625, 2.455810546875, 2.56396484375, 2.672119140625, 2.7802734375, 2.888427734375, 2.99658203125, 3.104736328125, 3.212890625, 3.321044921875, 3.42919921875, 3.537353515625, 3.6455078125, 3.753662109375, 3.86181640625, 3.969970703125, 4.078125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 7.0, 7.0, 12.0, 6.0, 6.0, 15.0, 18.0, 15.0, 27.0, 27.0, 32.0, 60.0, 136.0, 329.0, 814.0, 2629.0, 10058.0, 48771.0, 398912.0, 3016581.0, 630768.0, 66853.0, 13118.0, 3307.0, 945.0, 386.0, 139.0, 76.0, 40.0, 32.0, 22.0, 30.0, 18.0, 13.0, 12.0, 12.0, 9.0, 5.0, 2.0, 7.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-10.578125, -10.2322998046875, -9.886474609375, -9.5406494140625, -9.19482421875, -8.8489990234375, -8.503173828125, -8.1573486328125, -7.8115234375, -7.4656982421875, -7.119873046875, -6.7740478515625, -6.42822265625, -6.0823974609375, -5.736572265625, -5.3907470703125, -5.044921875, -4.6990966796875, -4.353271484375, -4.0074462890625, -3.66162109375, -3.3157958984375, -2.969970703125, -2.6241455078125, -2.2783203125, -1.9324951171875, -1.586669921875, -1.2408447265625, -0.89501953125, -0.5491943359375, -0.203369140625, 0.1424560546875, 0.48828125, 0.8341064453125, 1.179931640625, 1.5257568359375, 1.87158203125, 2.2174072265625, 2.563232421875, 2.9090576171875, 3.2548828125, 3.6007080078125, 3.946533203125, 4.2923583984375, 4.63818359375, 4.9840087890625, 5.329833984375, 5.6756591796875, 6.021484375, 6.3673095703125, 6.713134765625, 7.0589599609375, 7.40478515625, 7.7506103515625, 8.096435546875, 8.4422607421875, 8.7880859375, 9.1339111328125, 9.479736328125, 9.8255615234375, 10.17138671875, 10.5172119140625, 10.863037109375, 11.2088623046875, 11.5546875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 6.0, 12.0, 23.0, 25.0, 47.0, 76.0, 100.0, 165.0, 270.0, 389.0, 548.0, 704.0, 592.0, 384.0, 270.0, 158.0, 109.0, 72.0, 35.0, 34.0, 21.0, 14.0, 6.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.04296875, -6.71539306640625, -6.3878173828125, -6.06024169921875, -5.732666015625, -5.40509033203125, -5.0775146484375, -4.74993896484375, -4.42236328125, -4.09478759765625, -3.7672119140625, -3.43963623046875, -3.112060546875, -2.78448486328125, -2.4569091796875, -2.12933349609375, -1.8017578125, -1.47418212890625, -1.1466064453125, -0.81903076171875, -0.491455078125, -0.16387939453125, 0.1636962890625, 0.49127197265625, 0.81884765625, 1.14642333984375, 1.4739990234375, 1.80157470703125, 2.129150390625, 2.45672607421875, 2.7843017578125, 3.11187744140625, 3.439453125, 3.76702880859375, 4.0946044921875, 4.42218017578125, 4.749755859375, 5.07733154296875, 5.4049072265625, 5.73248291015625, 6.06005859375, 6.38763427734375, 6.7152099609375, 7.04278564453125, 7.370361328125, 7.69793701171875, 8.0255126953125, 8.35308837890625, 8.6806640625, 9.00823974609375, 9.3358154296875, 9.66339111328125, 9.990966796875, 10.31854248046875, 10.6461181640625, 10.97369384765625, 11.30126953125, 11.62884521484375, 11.9564208984375, 12.28399658203125, 12.611572265625, 12.93914794921875, 13.2667236328125, 13.59429931640625, 13.921875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 9.0, 8.0, 17.0, 23.0, 27.0, 44.0, 75.0, 107.0, 224.0, 465.0, 1487.0, 10914.0, 184101.0, 3426226.0, 543302.0, 23480.0, 2565.0, 624.0, 220.0, 149.0, 83.0, 53.0, 30.0, 22.0, 13.0, 10.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.703125, -24.96142578125, -24.2197265625, -23.47802734375, -22.736328125, -21.99462890625, -21.2529296875, -20.51123046875, -19.76953125, -19.02783203125, -18.2861328125, -17.54443359375, -16.802734375, -16.06103515625, -15.3193359375, -14.57763671875, -13.8359375, -13.09423828125, -12.3525390625, -11.61083984375, -10.869140625, -10.12744140625, -9.3857421875, -8.64404296875, -7.90234375, -7.16064453125, -6.4189453125, -5.67724609375, -4.935546875, -4.19384765625, -3.4521484375, -2.71044921875, -1.96875, -1.22705078125, -0.4853515625, 0.25634765625, 0.998046875, 1.73974609375, 2.4814453125, 3.22314453125, 3.96484375, 4.70654296875, 5.4482421875, 6.18994140625, 6.931640625, 7.67333984375, 8.4150390625, 9.15673828125, 9.8984375, 10.64013671875, 11.3818359375, 12.12353515625, 12.865234375, 13.60693359375, 14.3486328125, 15.09033203125, 15.83203125, 16.57373046875, 17.3154296875, 18.05712890625, 18.798828125, 19.54052734375, 20.2822265625, 21.02392578125, 21.765625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 19.0, 18.0, 24.0, 30.0, 64.0, 65.0, 86.0, 79.0, 102.0, 89.0, 115.0, 65.0, 70.0, 58.0, 32.0, 25.0, 23.0, 11.0, 8.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.54084396362305, -34.31517028808594, -33.089500427246094, -31.863826751708984, -30.638154983520508, -29.41248321533203, -28.186809539794922, -26.961137771606445, -25.73546600341797, -24.509794235229492, -23.284122467041016, -22.058448791503906, -20.83277702331543, -19.607105255126953, -18.381431579589844, -17.155759811401367, -15.93008804321289, -14.704416275024414, -13.478743553161621, -12.253070831298828, -11.027399063110352, -9.801727294921875, -8.576054573059082, -7.350381851196289, -6.1247100830078125, -4.899037837982178, -3.673365592956543, -2.447693347930908, -1.2220211029052734, 0.003651142120361328, 1.229323387145996, 2.454996109008789, 3.6806678771972656, 4.9063401222229, 6.132012367248535, 7.35768461227417, 8.583356857299805, 9.809028625488281, 11.034701347351074, 12.260374069213867, 13.486045837402344, 14.71171760559082, 15.937390327453613, 17.163063049316406, 18.388734817504883, 19.61440658569336, 20.84008026123047, 22.065752029418945, 23.291423797607422, 24.5170955657959, 25.742767333984375, 26.968441009521484, 28.19411277770996, 29.419784545898438, 30.645458221435547, 31.871129989624023, 33.0968017578125, 34.32247543334961, 35.54814529418945, 36.77381896972656, 37.999488830566406, 39.225162506103516, 40.450836181640625, 41.67650604248047, 42.90217971801758]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 9.0, 4.0, 4.0, 12.0, 2.0, 15.0, 13.0, 17.0, 21.0, 20.0, 22.0, 33.0, 29.0, 36.0, 28.0, 34.0, 29.0, 39.0, 34.0, 37.0, 42.0, 40.0, 34.0, 25.0, 47.0, 33.0, 35.0, 30.0, 31.0, 37.0, 42.0, 24.0, 25.0, 21.0, 17.0, 11.0, 14.0, 11.0, 8.0, 11.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.46881866455078, -22.735694885253906, -22.0025691986084, -21.26944351196289, -20.536319732666016, -19.80319595336914, -19.070070266723633, -18.336944580078125, -17.60382080078125, -16.870697021484375, -16.137571334838867, -15.404446601867676, -14.671321868896484, -13.938197135925293, -13.205072402954102, -12.47194766998291, -11.738822937011719, -11.005698204040527, -10.272573471069336, -9.539448738098145, -8.806324005126953, -8.073199272155762, -7.34007453918457, -6.606949806213379, -5.8738250732421875, -5.140700340270996, -4.407575607299805, -3.6744508743286133, -2.941326141357422, -2.2082014083862305, -1.475076675415039, -0.7419519424438477, -0.00882720947265625, 0.7242975234985352, 1.4574222564697266, 2.190546989440918, 2.9236717224121094, 3.656796455383301, 4.389921188354492, 5.123045921325684, 5.856170654296875, 6.589295387268066, 7.322420120239258, 8.05554485321045, 8.78866958618164, 9.521794319152832, 10.254919052124023, 10.988043785095215, 11.721168518066406, 12.454293251037598, 13.187417984008789, 13.92054271697998, 14.653667449951172, 15.386792182922363, 16.119916915893555, 16.853042602539062, 17.586166381835938, 18.319290161132812, 19.05241584777832, 19.785541534423828, 20.518665313720703, 21.251789093017578, 21.984914779663086, 22.718040466308594, 23.45116424560547]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 7.0, 6.0, 14.0, 12.0, 12.0, 24.0, 20.0, 31.0, 37.0, 39.0, 46.0, 37.0, 51.0, 53.0, 35.0, 54.0, 53.0, 46.0, 57.0, 42.0, 41.0, 30.0, 42.0, 31.0, 25.0, 20.0, 19.0, 20.0, 13.0, 20.0, 13.0, 10.0, 8.0, 1.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.017578125, -2.906585693359375, -2.79559326171875, -2.684600830078125, -2.5736083984375, -2.462615966796875, -2.35162353515625, -2.240631103515625, -2.129638671875, -2.018646240234375, -1.90765380859375, -1.796661376953125, -1.6856689453125, -1.574676513671875, -1.46368408203125, -1.352691650390625, -1.24169921875, -1.130706787109375, -1.01971435546875, -0.908721923828125, -0.7977294921875, -0.686737060546875, -0.57574462890625, -0.464752197265625, -0.353759765625, -0.242767333984375, -0.13177490234375, -0.020782470703125, 0.0902099609375, 0.201202392578125, 0.31219482421875, 0.423187255859375, 0.5341796875, 0.645172119140625, 0.75616455078125, 0.867156982421875, 0.9781494140625, 1.089141845703125, 1.20013427734375, 1.311126708984375, 1.422119140625, 1.533111572265625, 1.64410400390625, 1.755096435546875, 1.8660888671875, 1.977081298828125, 2.08807373046875, 2.199066162109375, 2.31005859375, 2.421051025390625, 2.53204345703125, 2.643035888671875, 2.7540283203125, 2.865020751953125, 2.97601318359375, 3.087005615234375, 3.197998046875, 3.308990478515625, 3.41998291015625, 3.530975341796875, 3.6419677734375, 3.752960205078125, 3.86395263671875, 3.974945068359375, 4.0859375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 8.0, 9.0, 19.0, 36.0, 48.0, 50.0, 110.0, 165.0, 247.0, 414.0, 558.0, 867.0, 1527.0, 2339.0, 3706.0, 6082.0, 10026.0, 17355.0, 30159.0, 55548.0, 110554.0, 346332.0, 249615.0, 96628.0, 49156.0, 27155.0, 15755.0, 9183.0, 5671.0, 3419.0, 2100.0, 1332.0, 826.0, 541.0, 371.0, 207.0, 152.0, 87.0, 62.0, 48.0, 39.0, 19.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.32666015625, -0.3173027038574219, -0.30794525146484375, -0.2985877990722656, -0.2892303466796875, -0.2798728942871094, -0.27051544189453125, -0.2611579895019531, -0.251800537109375, -0.24244308471679688, -0.23308563232421875, -0.22372817993164062, -0.2143707275390625, -0.20501327514648438, -0.19565582275390625, -0.18629837036132812, -0.17694091796875, -0.16758346557617188, -0.15822601318359375, -0.14886856079101562, -0.1395111083984375, -0.13015365600585938, -0.12079620361328125, -0.11143875122070312, -0.102081298828125, -0.09272384643554688, -0.08336639404296875, -0.07400894165039062, -0.0646514892578125, -0.055294036865234375, -0.04593658447265625, -0.036579132080078125, -0.0272216796875, -0.017864227294921875, -0.00850677490234375, 0.000850677490234375, 0.0102081298828125, 0.019565582275390625, 0.02892303466796875, 0.038280487060546875, 0.047637939453125, 0.056995391845703125, 0.06635284423828125, 0.07571029663085938, 0.0850677490234375, 0.09442520141601562, 0.10378265380859375, 0.11314010620117188, 0.12249755859375, 0.13185501098632812, 0.14121246337890625, 0.15056991577148438, 0.1599273681640625, 0.16928482055664062, 0.17864227294921875, 0.18799972534179688, 0.197357177734375, 0.20671463012695312, 0.21607208251953125, 0.22542953491210938, 0.2347869873046875, 0.24414443969726562, 0.25350189208984375, 0.2628593444824219, 0.272216796875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 7.0, 12.0, 9.0, 9.0, 15.0, 15.0, 29.0, 23.0, 28.0, 28.0, 25.0, 31.0, 27.0, 36.0, 30.0, 37.0, 47.0, 33.0, 1064.0, 47.0, 46.0, 37.0, 29.0, 32.0, 41.0, 36.0, 29.0, 26.0, 22.0, 23.0, 21.0, 19.0, 13.0, 11.0, 22.0, 12.0, 6.0, 9.0, 8.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.349609375, -2.278045654296875, -2.20648193359375, -2.134918212890625, -2.0633544921875, -1.991790771484375, -1.92022705078125, -1.848663330078125, -1.777099609375, -1.705535888671875, -1.63397216796875, -1.562408447265625, -1.4908447265625, -1.419281005859375, -1.34771728515625, -1.276153564453125, -1.20458984375, -1.133026123046875, -1.06146240234375, -0.989898681640625, -0.9183349609375, -0.846771240234375, -0.77520751953125, -0.703643798828125, -0.632080078125, -0.560516357421875, -0.48895263671875, -0.417388916015625, -0.3458251953125, -0.274261474609375, -0.20269775390625, -0.131134033203125, -0.0595703125, 0.011993408203125, 0.08355712890625, 0.155120849609375, 0.2266845703125, 0.298248291015625, 0.36981201171875, 0.441375732421875, 0.512939453125, 0.584503173828125, 0.65606689453125, 0.727630615234375, 0.7991943359375, 0.870758056640625, 0.94232177734375, 1.013885498046875, 1.08544921875, 1.157012939453125, 1.22857666015625, 1.300140380859375, 1.3717041015625, 1.443267822265625, 1.51483154296875, 1.586395263671875, 1.657958984375, 1.729522705078125, 1.80108642578125, 1.872650146484375, 1.9442138671875, 2.015777587890625, 2.08734130859375, 2.158905029296875, 2.23046875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 4.0, 10.0, 18.0, 19.0, 25.0, 46.0, 71.0, 93.0, 141.0, 215.0, 290.0, 446.0, 592.0, 944.0, 1426.0, 2078.0, 3162.0, 4781.0, 7525.0, 11457.0, 18480.0, 30804.0, 53500.0, 97931.0, 247169.0, 1361643.0, 108446.0, 57000.0, 33346.0, 20176.0, 12486.0, 7781.0, 5044.0, 3343.0, 2122.0, 1491.0, 931.0, 693.0, 438.0, 315.0, 189.0, 146.0, 89.0, 64.0, 61.0, 30.0, 19.0, 22.0, 15.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1488037109375, -0.1440143585205078, -0.13922500610351562, -0.13443565368652344, -0.12964630126953125, -0.12485694885253906, -0.12006759643554688, -0.11527824401855469, -0.1104888916015625, -0.10569953918457031, -0.10091018676757812, -0.09612083435058594, -0.09133148193359375, -0.08654212951660156, -0.08175277709960938, -0.07696342468261719, -0.072174072265625, -0.06738471984863281, -0.06259536743164062, -0.05780601501464844, -0.05301666259765625, -0.04822731018066406, -0.043437957763671875, -0.03864860534667969, -0.0338592529296875, -0.029069900512695312, -0.024280548095703125, -0.019491195678710938, -0.01470184326171875, -0.009912490844726562, -0.005123138427734375, -0.0003337860107421875, 0.00445556640625, 0.009244918823242188, 0.014034271240234375, 0.018823623657226562, 0.02361297607421875, 0.028402328491210938, 0.033191680908203125, 0.03798103332519531, 0.0427703857421875, 0.04755973815917969, 0.052349090576171875, 0.05713844299316406, 0.06192779541015625, 0.06671714782714844, 0.07150650024414062, 0.07629585266113281, 0.081085205078125, 0.08587455749511719, 0.09066390991210938, 0.09545326232910156, 0.10024261474609375, 0.10503196716308594, 0.10982131958007812, 0.11461067199707031, 0.1194000244140625, 0.12418937683105469, 0.12897872924804688, 0.13376808166503906, 0.13855743408203125, 0.14334678649902344, 0.14813613891601562, 0.1529254913330078, 0.15771484375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 1.0, 8.0, 7.0, 10.0, 9.0, 17.0, 27.0, 28.0, 60.0, 83.0, 123.0, 201.0, 130.0, 81.0, 56.0, 40.0, 29.0, 22.0, 14.0, 7.0, 9.0, 6.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.170967102050781e-05, -3.093015402555466e-05, -3.01506370306015e-05, -2.9371120035648346e-05, -2.859160304069519e-05, -2.7812086045742035e-05, -2.703256905078888e-05, -2.6253052055835724e-05, -2.547353506088257e-05, -2.4694018065929413e-05, -2.3914501070976257e-05, -2.3134984076023102e-05, -2.2355467081069946e-05, -2.157595008611679e-05, -2.0796433091163635e-05, -2.001691609621048e-05, -1.9237399101257324e-05, -1.845788210630417e-05, -1.7678365111351013e-05, -1.6898848116397858e-05, -1.6119331121444702e-05, -1.5339814126491547e-05, -1.4560297131538391e-05, -1.3780780136585236e-05, -1.300126314163208e-05, -1.2221746146678925e-05, -1.1442229151725769e-05, -1.0662712156772614e-05, -9.883195161819458e-06, -9.103678166866302e-06, -8.324161171913147e-06, -7.5446441769599915e-06, -6.765127182006836e-06, -5.98561018705368e-06, -5.206093192100525e-06, -4.426576197147369e-06, -3.647059202194214e-06, -2.8675422072410583e-06, -2.088025212287903e-06, -1.3085082173347473e-06, -5.289912223815918e-07, 2.505257725715637e-07, 1.0300427675247192e-06, 1.8095597624778748e-06, 2.5890767574310303e-06, 3.368593752384186e-06, 4.148110747337341e-06, 4.927627742290497e-06, 5.707144737243652e-06, 6.486661732196808e-06, 7.266178727149963e-06, 8.045695722103119e-06, 8.825212717056274e-06, 9.60472971200943e-06, 1.0384246706962585e-05, 1.1163763701915741e-05, 1.1943280696868896e-05, 1.2722797691822052e-05, 1.3502314686775208e-05, 1.4281831681728363e-05, 1.5061348676681519e-05, 1.5840865671634674e-05, 1.662038266658783e-05, 1.7399899661540985e-05, 1.817941665649414e-05]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 8.0, 6.0, 9.0, 7.0, 9.0, 29.0, 45.0, 108.0, 339.0, 2656.0, 69046.0, 947072.0, 27287.0, 1489.0, 217.0, 101.0, 42.0, 22.0, 14.0, 9.0, 9.0, 6.0, 5.0, 5.0, 1.0, 2.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003304481506347656, -0.0003163143992424011, -0.0003021806478500366, -0.0002880468964576721, -0.0002739131450653076, -0.0002597793936729431, -0.0002456456422805786, -0.0002315118908882141, -0.0002173781394958496, -0.0002032443881034851, -0.0001891106367111206, -0.0001749768853187561, -0.0001608431339263916, -0.0001467093825340271, -0.0001325756311416626, -0.0001184418797492981, -0.0001043081283569336, -9.017437696456909e-05, -7.604062557220459e-05, -6.190687417984009e-05, -4.7773122787475586e-05, -3.3639371395111084e-05, -1.9505620002746582e-05, -5.37186861038208e-06, 8.761882781982422e-06, 2.2895634174346924e-05, 3.7029385566711426e-05, 5.116313695907593e-05, 6.529688835144043e-05, 7.943063974380493e-05, 9.356439113616943e-05, 0.00010769814252853394, 0.00012183189392089844, 0.00013596564531326294, 0.00015009939670562744, 0.00016423314809799194, 0.00017836689949035645, 0.00019250065088272095, 0.00020663440227508545, 0.00022076815366744995, 0.00023490190505981445, 0.00024903565645217896, 0.00026316940784454346, 0.00027730315923690796, 0.00029143691062927246, 0.00030557066202163696, 0.00031970441341400146, 0.00033383816480636597, 0.00034797191619873047, 0.00036210566759109497, 0.00037623941898345947, 0.000390373170375824, 0.0004045069217681885, 0.000418640673160553, 0.0004327744245529175, 0.000446908175945282, 0.0004610419273376465, 0.000475175678730011, 0.0004893094301223755, 0.00050344318151474, 0.0005175769329071045, 0.000531710684299469, 0.0005458444356918335, 0.000559978187084198, 0.0005741119384765625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 10.0, 24.0, 47.0, 66.0, 109.0, 155.0, 165.0, 149.0, 104.0, 69.0, 44.0, 20.0, 16.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0268806110834703e-05, -1.9371320377103984e-05, -1.847383646236267e-05, -1.757635072863195e-05, -1.6678864994901232e-05, -1.5781381080159917e-05, -1.4883895346429199e-05, -1.398640961269848e-05, -1.3088924788462464e-05, -1.2191439964226447e-05, -1.1293954230495729e-05, -1.0396469406259712e-05, -9.498984582023695e-06, -8.601498848292977e-06, -7.70401402405696e-06, -6.806528745073592e-06, -5.909043466090225e-06, -5.011558187106857e-06, -4.1140729081234895e-06, -3.2165880838874727e-06, -2.319102804904105e-06, -1.4216175259207375e-06, -5.241327016847208e-07, 3.733525772986468e-07, 1.2708378562820144e-06, 2.168323135265382e-06, 3.065808186875074e-06, 3.963293238484766e-06, 4.860778517468134e-06, 5.7582637964515015e-06, 6.655748620687518e-06, 7.553233899670886e-06, 8.450719178654253e-06, 9.34820400289027e-06, 1.0245689736620989e-05, 1.1143174560857005e-05, 1.2040660294587724e-05, 1.293814511882374e-05, 1.3835629943059757e-05, 1.4733115676790476e-05, 1.5630601410521194e-05, 1.6528087144251913e-05, 1.7425571058993228e-05, 1.8323056792723946e-05, 1.9220542526454665e-05, 2.011802644119598e-05, 2.1015512174926698e-05, 2.1912997908657417e-05, 2.281048182339873e-05, 2.370796755712945e-05, 2.4605451471870765e-05, 2.5502937205601484e-05, 2.6400422939332202e-05, 2.729790867306292e-05, 2.8195392587804236e-05, 2.9092878321534954e-05, 2.999036223627627e-05, 3.088784797000699e-05, 3.1785333703737706e-05, 3.268281579948962e-05, 3.3580301533220336e-05, 3.4477787266951054e-05, 3.537527300068177e-05, 3.627275873441249e-05, 3.717024446814321e-05]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 7.0, 8.0, 10.0, 13.0, 10.0, 19.0, 17.0, 24.0, 20.0, 26.0, 31.0, 36.0, 35.0, 37.0, 47.0, 45.0, 45.0, 47.0, 51.0, 39.0, 43.0, 54.0, 30.0, 36.0, 28.0, 34.0, 38.0, 28.0, 30.0, 22.0, 15.0, 13.0, 12.0, 9.0, 7.0, 6.0, 6.0, 5.0, 2.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.417533874511719e-06, -9.126029908657074e-06, -8.83452594280243e-06, -8.543021976947784e-06, -8.25151801109314e-06, -7.960014045238495e-06, -7.66851007938385e-06, -7.377006113529205e-06, -7.0855021476745605e-06, -6.793998181819916e-06, -6.502494215965271e-06, -6.210990250110626e-06, -5.9194862842559814e-06, -5.627982318401337e-06, -5.336478352546692e-06, -5.044974386692047e-06, -4.753470420837402e-06, -4.4619664549827576e-06, -4.170462489128113e-06, -3.878958523273468e-06, -3.5874545574188232e-06, -3.2959505915641785e-06, -3.0044466257095337e-06, -2.712942659854889e-06, -2.421438694000244e-06, -2.1299347281455994e-06, -1.8384307622909546e-06, -1.5469267964363098e-06, -1.255422830581665e-06, -9.639188647270203e-07, -6.724148988723755e-07, -3.809109330177307e-07, -8.940696716308594e-08, 2.0209699869155884e-07, 4.936009645462036e-07, 7.851049304008484e-07, 1.0766088962554932e-06, 1.368112862110138e-06, 1.6596168279647827e-06, 1.9511207938194275e-06, 2.2426247596740723e-06, 2.534128725528717e-06, 2.825632691383362e-06, 3.1171366572380066e-06, 3.4086406230926514e-06, 3.700144588947296e-06, 3.991648554801941e-06, 4.283152520656586e-06, 4.5746564865112305e-06, 4.866160452365875e-06, 5.15766441822052e-06, 5.449168384075165e-06, 5.7406723499298096e-06, 6.032176315784454e-06, 6.323680281639099e-06, 6.615184247493744e-06, 6.906688213348389e-06, 7.1981921792030334e-06, 7.489696145057678e-06, 7.781200110912323e-06, 8.072704076766968e-06, 8.364208042621613e-06, 8.655712008476257e-06, 8.947215974330902e-06, 9.238719940185547e-06]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 7.0, 6.0, 14.0, 12.0, 12.0, 24.0, 20.0, 31.0, 37.0, 39.0, 46.0, 37.0, 51.0, 53.0, 35.0, 54.0, 53.0, 46.0, 57.0, 42.0, 41.0, 30.0, 42.0, 31.0, 25.0, 20.0, 19.0, 20.0, 13.0, 20.0, 13.0, 10.0, 8.0, 1.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.017578125, -2.906585693359375, -2.79559326171875, -2.684600830078125, -2.5736083984375, -2.462615966796875, -2.35162353515625, -2.240631103515625, -2.129638671875, -2.018646240234375, -1.90765380859375, -1.796661376953125, -1.6856689453125, -1.574676513671875, -1.46368408203125, -1.352691650390625, -1.24169921875, -1.130706787109375, -1.01971435546875, -0.908721923828125, -0.7977294921875, -0.686737060546875, -0.57574462890625, -0.464752197265625, -0.353759765625, -0.242767333984375, -0.13177490234375, -0.020782470703125, 0.0902099609375, 0.201202392578125, 0.31219482421875, 0.423187255859375, 0.5341796875, 0.645172119140625, 0.75616455078125, 0.867156982421875, 0.9781494140625, 1.089141845703125, 1.20013427734375, 1.311126708984375, 1.422119140625, 1.533111572265625, 1.64410400390625, 1.755096435546875, 1.8660888671875, 1.977081298828125, 2.08807373046875, 2.199066162109375, 2.31005859375, 2.421051025390625, 2.53204345703125, 2.643035888671875, 2.7540283203125, 2.865020751953125, 2.97601318359375, 3.087005615234375, 3.197998046875, 3.308990478515625, 3.41998291015625, 3.530975341796875, 3.6419677734375, 3.752960205078125, 3.86395263671875, 3.974945068359375, 4.0859375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 10.0, 15.0, 11.0, 19.0, 46.0, 77.0, 123.0, 190.0, 278.0, 492.0, 887.0, 1512.0, 2596.0, 4263.0, 7515.0, 13012.0, 23341.0, 43544.0, 93060.0, 251015.0, 350131.0, 132012.0, 56895.0, 29367.0, 16150.0, 9302.0, 5266.0, 2983.0, 1749.0, 1098.0, 639.0, 352.0, 244.0, 131.0, 92.0, 50.0, 37.0, 19.0, 12.0, 8.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.81524658203125, -4.6656494140625, -4.51605224609375, -4.366455078125, -4.21685791015625, -4.0672607421875, -3.91766357421875, -3.76806640625, -3.61846923828125, -3.4688720703125, -3.31927490234375, -3.169677734375, -3.02008056640625, -2.8704833984375, -2.72088623046875, -2.5712890625, -2.42169189453125, -2.2720947265625, -2.12249755859375, -1.972900390625, -1.82330322265625, -1.6737060546875, -1.52410888671875, -1.37451171875, -1.22491455078125, -1.0753173828125, -0.92572021484375, -0.776123046875, -0.62652587890625, -0.4769287109375, -0.32733154296875, -0.177734375, -0.02813720703125, 0.1214599609375, 0.27105712890625, 0.420654296875, 0.57025146484375, 0.7198486328125, 0.86944580078125, 1.01904296875, 1.16864013671875, 1.3182373046875, 1.46783447265625, 1.617431640625, 1.76702880859375, 1.9166259765625, 2.06622314453125, 2.2158203125, 2.36541748046875, 2.5150146484375, 2.66461181640625, 2.814208984375, 2.96380615234375, 3.1134033203125, 3.26300048828125, 3.41259765625, 3.56219482421875, 3.7117919921875, 3.86138916015625, 4.010986328125, 4.16058349609375, 4.3101806640625, 4.45977783203125, 4.609375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 6.0, 5.0, 9.0, 5.0, 9.0, 12.0, 20.0, 15.0, 14.0, 19.0, 35.0, 23.0, 38.0, 38.0, 40.0, 44.0, 66.0, 79.0, 175.0, 1358.0, 366.0, 188.0, 79.0, 50.0, 44.0, 44.0, 37.0, 34.0, 27.0, 19.0, 17.0, 16.0, 20.0, 19.0, 14.0, 11.0, 13.0, 5.0, 6.0, 10.0, 2.0, 2.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.828125, -8.5128173828125, -8.197509765625, -7.8822021484375, -7.56689453125, -7.2515869140625, -6.936279296875, -6.6209716796875, -6.3056640625, -5.9903564453125, -5.675048828125, -5.3597412109375, -5.04443359375, -4.7291259765625, -4.413818359375, -4.0985107421875, -3.783203125, -3.4678955078125, -3.152587890625, -2.8372802734375, -2.52197265625, -2.2066650390625, -1.891357421875, -1.5760498046875, -1.2607421875, -0.9454345703125, -0.630126953125, -0.3148193359375, 0.00048828125, 0.3157958984375, 0.631103515625, 0.9464111328125, 1.26171875, 1.5770263671875, 1.892333984375, 2.2076416015625, 2.52294921875, 2.8382568359375, 3.153564453125, 3.4688720703125, 3.7841796875, 4.0994873046875, 4.414794921875, 4.7301025390625, 5.04541015625, 5.3607177734375, 5.676025390625, 5.9913330078125, 6.306640625, 6.6219482421875, 6.937255859375, 7.2525634765625, 7.56787109375, 7.8831787109375, 8.198486328125, 8.5137939453125, 8.8291015625, 9.1444091796875, 9.459716796875, 9.7750244140625, 10.09033203125, 10.4056396484375, 10.720947265625, 11.0362548828125, 11.3515625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 9.0, 4.0, 13.0, 10.0, 18.0, 18.0, 37.0, 43.0, 42.0, 46.0, 75.0, 99.0, 140.0, 199.0, 362.0, 1056.0, 5586.0, 49725.0, 2323189.0, 732693.0, 27134.0, 3449.0, 753.0, 308.0, 169.0, 135.0, 82.0, 77.0, 52.0, 46.0, 39.0, 16.0, 20.0, 19.0, 5.0, 9.0, 7.0, 9.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.078125, -21.445068359375, -20.81201171875, -20.178955078125, -19.5458984375, -18.912841796875, -18.27978515625, -17.646728515625, -17.013671875, -16.380615234375, -15.74755859375, -15.114501953125, -14.4814453125, -13.848388671875, -13.21533203125, -12.582275390625, -11.94921875, -11.316162109375, -10.68310546875, -10.050048828125, -9.4169921875, -8.783935546875, -8.15087890625, -7.517822265625, -6.884765625, -6.251708984375, -5.61865234375, -4.985595703125, -4.3525390625, -3.719482421875, -3.08642578125, -2.453369140625, -1.8203125, -1.187255859375, -0.55419921875, 0.078857421875, 0.7119140625, 1.344970703125, 1.97802734375, 2.611083984375, 3.244140625, 3.877197265625, 4.51025390625, 5.143310546875, 5.7763671875, 6.409423828125, 7.04248046875, 7.675537109375, 8.30859375, 8.941650390625, 9.57470703125, 10.207763671875, 10.8408203125, 11.473876953125, 12.10693359375, 12.739990234375, 13.373046875, 14.006103515625, 14.63916015625, 15.272216796875, 15.9052734375, 16.538330078125, 17.17138671875, 17.804443359375, 18.4375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [6.0, 77.0, 489.0, 399.0, 45.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.255545616149902, -8.733220100402832, -4.210894584655762, 0.3114309310913086, 4.833756446838379, 9.35608196258545, 13.87840747833252, 18.400733947753906, 22.923057556152344, 27.445383071899414, 31.967708587646484, 36.49003601074219, 41.012359619140625, 45.53468322753906, 50.057010650634766, 54.57933807373047, 59.101661682128906, 63.623985290527344, 68.14631652832031, 72.66864013671875, 77.19096374511719, 81.71328735351562, 86.23561096191406, 90.75794219970703, 95.28026580810547, 99.8025894165039, 104.32492065429688, 108.84724426269531, 113.36956787109375, 117.89189147949219, 122.41421508789062, 126.9365463256836, 131.4588623046875, 135.98118591308594, 140.50350952148438, 145.0258331298828, 149.54815673828125, 154.07049560546875, 158.5928192138672, 163.11514282226562, 167.63746643066406, 172.1597900390625, 176.68211364746094, 181.20443725585938, 185.72677612304688, 190.2490997314453, 194.77142333984375, 199.2937469482422, 203.81607055664062, 208.33839416503906, 212.8607177734375, 217.38304138183594, 221.90536499023438, 226.42770385742188, 230.9500274658203, 235.47235107421875, 239.9946746826172, 244.51699829101562, 249.03932189941406, 253.5616455078125, 258.083984375, 262.6062927246094, 267.1286315917969, 271.65093994140625, 276.17327880859375]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 8.0, 6.0, 10.0, 12.0, 9.0, 11.0, 11.0, 16.0, 21.0, 27.0, 20.0, 20.0, 33.0, 24.0, 33.0, 26.0, 30.0, 24.0, 40.0, 36.0, 37.0, 46.0, 49.0, 42.0, 39.0, 28.0, 34.0, 28.0, 36.0, 25.0, 34.0, 22.0, 22.0, 16.0, 25.0, 15.0, 11.0, 22.0, 4.0, 13.0, 8.0, 7.0, 8.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.27646255493164, -26.377737045288086, -25.4790096282959, -24.580284118652344, -23.68155860900879, -22.7828311920166, -21.884105682373047, -20.98537826538086, -20.086652755737305, -19.18792724609375, -18.289199829101562, -17.390474319458008, -16.491748809814453, -15.593021392822266, -14.694295883178711, -13.79556941986084, -12.896843910217285, -11.998117446899414, -11.09939193725586, -10.200665473937988, -9.301939010620117, -8.403213500976562, -7.504487037658691, -6.60576057434082, -5.707034587860107, -4.8083086013793945, -3.9095821380615234, -3.0108561515808105, -2.1121299266815186, -1.2134037017822266, -0.31467771530151367, 0.5840487480163574, 1.4827747344970703, 2.3815009593963623, 3.2802271842956543, 4.178953170776367, 5.077679634094238, 5.976405620574951, 6.875131607055664, 7.773858070373535, 8.672584533691406, 9.571310997009277, 10.470036506652832, 11.368762969970703, 12.267489433288574, 13.166215896606445, 14.06494140625, 14.963667869567871, 15.862393379211426, 16.761119842529297, 17.65984535217285, 18.558570861816406, 19.457298278808594, 20.35602378845215, 21.254749298095703, 22.15347671508789, 23.052202224731445, 23.950927734375, 24.849655151367188, 25.748380661010742, 26.647106170654297, 27.545833587646484, 28.44455909729004, 29.343284606933594, 30.24201202392578]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 6.0, 3.0, 8.0, 4.0, 16.0, 13.0, 14.0, 18.0, 25.0, 32.0, 31.0, 46.0, 48.0, 46.0, 52.0, 44.0, 62.0, 56.0, 44.0, 55.0, 42.0, 46.0, 34.0, 46.0, 38.0, 24.0, 22.0, 17.0, 18.0, 16.0, 22.0, 8.0, 14.0, 3.0, 7.0, 4.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.279296875, -3.156768798828125, -3.03424072265625, -2.911712646484375, -2.7891845703125, -2.666656494140625, -2.54412841796875, -2.421600341796875, -2.299072265625, -2.176544189453125, -2.05401611328125, -1.931488037109375, -1.8089599609375, -1.686431884765625, -1.56390380859375, -1.441375732421875, -1.31884765625, -1.196319580078125, -1.07379150390625, -0.951263427734375, -0.8287353515625, -0.706207275390625, -0.58367919921875, -0.461151123046875, -0.338623046875, -0.216094970703125, -0.09356689453125, 0.028961181640625, 0.1514892578125, 0.274017333984375, 0.39654541015625, 0.519073486328125, 0.6416015625, 0.764129638671875, 0.88665771484375, 1.009185791015625, 1.1317138671875, 1.254241943359375, 1.37677001953125, 1.499298095703125, 1.621826171875, 1.744354248046875, 1.86688232421875, 1.989410400390625, 2.1119384765625, 2.234466552734375, 2.35699462890625, 2.479522705078125, 2.60205078125, 2.724578857421875, 2.84710693359375, 2.969635009765625, 3.0921630859375, 3.214691162109375, 3.33721923828125, 3.459747314453125, 3.582275390625, 3.704803466796875, 3.82733154296875, 3.949859619140625, 4.0723876953125, 4.194915771484375, 4.31744384765625, 4.439971923828125, 4.5625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 2.0, 5.0, 10.0, 8.0, 18.0, 9.0, 14.0, 33.0, 52.0, 74.0, 132.0, 229.0, 491.0, 1017.0, 2650.0, 7786.0, 31168.0, 185634.0, 1792114.0, 1926442.0, 200362.0, 33024.0, 8143.0, 2714.0, 1036.0, 480.0, 233.0, 128.0, 79.0, 55.0, 33.0, 16.0, 25.0, 12.0, 10.0, 3.0, 4.0, 7.0, 7.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8203125, -8.516357421875, -8.21240234375, -7.908447265625, -7.6044921875, -7.300537109375, -6.99658203125, -6.692626953125, -6.388671875, -6.084716796875, -5.78076171875, -5.476806640625, -5.1728515625, -4.868896484375, -4.56494140625, -4.260986328125, -3.95703125, -3.653076171875, -3.34912109375, -3.045166015625, -2.7412109375, -2.437255859375, -2.13330078125, -1.829345703125, -1.525390625, -1.221435546875, -0.91748046875, -0.613525390625, -0.3095703125, -0.005615234375, 0.29833984375, 0.602294921875, 0.90625, 1.210205078125, 1.51416015625, 1.818115234375, 2.1220703125, 2.426025390625, 2.72998046875, 3.033935546875, 3.337890625, 3.641845703125, 3.94580078125, 4.249755859375, 4.5537109375, 4.857666015625, 5.16162109375, 5.465576171875, 5.76953125, 6.073486328125, 6.37744140625, 6.681396484375, 6.9853515625, 7.289306640625, 7.59326171875, 7.897216796875, 8.201171875, 8.505126953125, 8.80908203125, 9.113037109375, 9.4169921875, 9.720947265625, 10.02490234375, 10.328857421875, 10.6328125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 8.0, 6.0, 7.0, 10.0, 5.0, 7.0, 20.0, 25.0, 37.0, 48.0, 74.0, 99.0, 114.0, 162.0, 232.0, 330.0, 421.0, 465.0, 475.0, 383.0, 300.0, 219.0, 150.0, 117.0, 95.0, 68.0, 64.0, 29.0, 34.0, 22.0, 16.0, 8.0, 12.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5859375, -6.3575439453125, -6.129150390625, -5.9007568359375, -5.67236328125, -5.4439697265625, -5.215576171875, -4.9871826171875, -4.7587890625, -4.5303955078125, -4.302001953125, -4.0736083984375, -3.84521484375, -3.6168212890625, -3.388427734375, -3.1600341796875, -2.931640625, -2.7032470703125, -2.474853515625, -2.2464599609375, -2.01806640625, -1.7896728515625, -1.561279296875, -1.3328857421875, -1.1044921875, -0.8760986328125, -0.647705078125, -0.4193115234375, -0.19091796875, 0.0374755859375, 0.265869140625, 0.4942626953125, 0.72265625, 0.9510498046875, 1.179443359375, 1.4078369140625, 1.63623046875, 1.8646240234375, 2.093017578125, 2.3214111328125, 2.5498046875, 2.7781982421875, 3.006591796875, 3.2349853515625, 3.46337890625, 3.6917724609375, 3.920166015625, 4.1485595703125, 4.376953125, 4.6053466796875, 4.833740234375, 5.0621337890625, 5.29052734375, 5.5189208984375, 5.747314453125, 5.9757080078125, 6.2041015625, 6.4324951171875, 6.660888671875, 6.8892822265625, 7.11767578125, 7.3460693359375, 7.574462890625, 7.8028564453125, 8.03125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 12.0, 7.0, 23.0, 23.0, 29.0, 43.0, 80.0, 101.0, 135.0, 186.0, 324.0, 797.0, 2703.0, 22322.0, 421815.0, 3450751.0, 274905.0, 16353.0, 2148.0, 669.0, 319.0, 190.0, 93.0, 68.0, 53.0, 33.0, 32.0, 16.0, 8.0, 11.0, 7.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.09375, -24.405029296875, -23.71630859375, -23.027587890625, -22.3388671875, -21.650146484375, -20.96142578125, -20.272705078125, -19.583984375, -18.895263671875, -18.20654296875, -17.517822265625, -16.8291015625, -16.140380859375, -15.45166015625, -14.762939453125, -14.07421875, -13.385498046875, -12.69677734375, -12.008056640625, -11.3193359375, -10.630615234375, -9.94189453125, -9.253173828125, -8.564453125, -7.875732421875, -7.18701171875, -6.498291015625, -5.8095703125, -5.120849609375, -4.43212890625, -3.743408203125, -3.0546875, -2.365966796875, -1.67724609375, -0.988525390625, -0.2998046875, 0.388916015625, 1.07763671875, 1.766357421875, 2.455078125, 3.143798828125, 3.83251953125, 4.521240234375, 5.2099609375, 5.898681640625, 6.58740234375, 7.276123046875, 7.96484375, 8.653564453125, 9.34228515625, 10.031005859375, 10.7197265625, 11.408447265625, 12.09716796875, 12.785888671875, 13.474609375, 14.163330078125, 14.85205078125, 15.540771484375, 16.2294921875, 16.918212890625, 17.60693359375, 18.295654296875, 18.984375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 12.0, 29.0, 80.0, 118.0, 182.0, 205.0, 181.0, 114.0, 59.0, 27.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.81019592285156, -94.28641510009766, -91.76264190673828, -89.23886108398438, -86.715087890625, -84.1913070678711, -81.66752624511719, -79.14375305175781, -76.6199722290039, -74.09619140625, -71.57241821289062, -69.04863739013672, -66.52486419677734, -64.00108337402344, -61.4773063659668, -58.953529357910156, -56.429752349853516, -53.905975341796875, -51.382198333740234, -48.858421325683594, -46.33464050292969, -43.81086349487305, -41.287086486816406, -38.7633056640625, -36.239532470703125, -33.715755462646484, -31.19197654724121, -28.66819953918457, -26.144420623779297, -23.620643615722656, -21.096866607666016, -18.573087692260742, -16.04930877685547, -13.525530815124512, -11.001752853393555, -8.477975845336914, -5.954197883605957, -3.430419921875, -0.9066429138183594, 1.617136001586914, 4.140913009643555, 6.664690971374512, 9.188468933105469, 11.71224594116211, 14.236023902893066, 16.759801864624023, 19.283578872680664, 21.807357788085938, 24.331134796142578, 26.85491180419922, 29.378690719604492, 31.902467727661133, 34.426246643066406, 36.95002365112305, 39.47380065917969, 41.997581481933594, 44.52135467529297, 47.04513168334961, 49.56890869140625, 52.092689514160156, 54.6164665222168, 57.14024353027344, 59.66402053833008, 62.18779754638672, 64.71157836914062]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 8.0, 17.0, 16.0, 11.0, 16.0, 21.0, 18.0, 22.0, 19.0, 23.0, 26.0, 26.0, 30.0, 39.0, 34.0, 38.0, 44.0, 42.0, 46.0, 49.0, 27.0, 39.0, 29.0, 37.0, 32.0, 41.0, 35.0, 24.0, 17.0, 26.0, 23.0, 21.0, 19.0, 11.0, 12.0, 14.0, 9.0, 11.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-24.831104278564453, -24.10629653930664, -23.381488800048828, -22.656681060791016, -21.931873321533203, -21.20706558227539, -20.482257843017578, -19.757450103759766, -19.032642364501953, -18.30783462524414, -17.583026885986328, -16.858219146728516, -16.133411407470703, -15.40860366821289, -14.683795928955078, -13.958988189697266, -13.234179496765137, -12.509371757507324, -11.784564018249512, -11.0597562789917, -10.334948539733887, -9.610140800476074, -8.885332107543945, -8.160524368286133, -7.4357171058654785, -6.710909366607666, -5.9861016273498535, -5.261293411254883, -4.53648567199707, -3.811678171157837, -3.0868701934814453, -2.362062454223633, -1.6372547149658203, -0.912446916103363, -0.18763911724090576, 0.5371687412261963, 1.2619764804840088, 1.9867842197418213, 2.711592197418213, 3.4363999366760254, 4.161207675933838, 4.88601541519165, 5.610823154449463, 6.335631370544434, 7.060439109802246, 7.785246849060059, 8.510054588317871, 9.234862327575684, 9.959670066833496, 10.684477806091309, 11.409285545349121, 12.134093284606934, 12.858901023864746, 13.583708763122559, 14.308517456054688, 15.0333251953125, 15.758132934570312, 16.482940673828125, 17.207748413085938, 17.93255615234375, 18.657363891601562, 19.382171630859375, 20.106979370117188, 20.831787109375, 21.556594848632812]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 7.0, 5.0, 9.0, 9.0, 18.0, 10.0, 29.0, 19.0, 33.0, 42.0, 41.0, 48.0, 43.0, 43.0, 44.0, 55.0, 45.0, 41.0, 52.0, 42.0, 44.0, 37.0, 45.0, 28.0, 31.0, 16.0, 29.0, 12.0, 26.0, 17.0, 12.0, 8.0, 8.0, 8.0, 13.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.283203125, -3.169342041015625, -3.05548095703125, -2.941619873046875, -2.8277587890625, -2.713897705078125, -2.60003662109375, -2.486175537109375, -2.372314453125, -2.258453369140625, -2.14459228515625, -2.030731201171875, -1.9168701171875, -1.803009033203125, -1.68914794921875, -1.575286865234375, -1.46142578125, -1.347564697265625, -1.23370361328125, -1.119842529296875, -1.0059814453125, -0.892120361328125, -0.77825927734375, -0.664398193359375, -0.550537109375, -0.436676025390625, -0.32281494140625, -0.208953857421875, -0.0950927734375, 0.018768310546875, 0.13262939453125, 0.246490478515625, 0.3603515625, 0.474212646484375, 0.58807373046875, 0.701934814453125, 0.8157958984375, 0.929656982421875, 1.04351806640625, 1.157379150390625, 1.271240234375, 1.385101318359375, 1.49896240234375, 1.612823486328125, 1.7266845703125, 1.840545654296875, 1.95440673828125, 2.068267822265625, 2.18212890625, 2.295989990234375, 2.40985107421875, 2.523712158203125, 2.6375732421875, 2.751434326171875, 2.86529541015625, 2.979156494140625, 3.093017578125, 3.206878662109375, 3.32073974609375, 3.434600830078125, 3.5484619140625, 3.662322998046875, 3.77618408203125, 3.890045166015625, 4.00390625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 9.0, 12.0, 12.0, 27.0, 37.0, 43.0, 75.0, 87.0, 171.0, 246.0, 333.0, 514.0, 781.0, 1209.0, 1931.0, 2860.0, 4622.0, 7408.0, 12319.0, 20959.0, 36844.0, 68172.0, 138730.0, 368442.0, 188788.0, 85140.0, 45156.0, 24885.0, 14652.0, 8913.0, 5456.0, 3322.0, 2244.0, 1419.0, 911.0, 598.0, 401.0, 264.0, 193.0, 120.0, 86.0, 50.0, 35.0, 29.0, 17.0, 15.0, 6.0, 9.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28125, -0.2717704772949219, -0.26229095458984375, -0.2528114318847656, -0.2433319091796875, -0.23385238647460938, -0.22437286376953125, -0.21489334106445312, -0.205413818359375, -0.19593429565429688, -0.18645477294921875, -0.17697525024414062, -0.1674957275390625, -0.15801620483398438, -0.14853668212890625, -0.13905715942382812, -0.12957763671875, -0.12009811401367188, -0.11061859130859375, -0.10113906860351562, -0.0916595458984375, -0.08218002319335938, -0.07270050048828125, -0.06322097778320312, -0.053741455078125, -0.044261932373046875, -0.03478240966796875, -0.025302886962890625, -0.0158233642578125, -0.006343841552734375, 0.00313568115234375, 0.012615203857421875, 0.0220947265625, 0.031574249267578125, 0.04105377197265625, 0.050533294677734375, 0.0600128173828125, 0.06949234008789062, 0.07897186279296875, 0.08845138549804688, 0.097930908203125, 0.10741043090820312, 0.11688995361328125, 0.12636947631835938, 0.1358489990234375, 0.14532852172851562, 0.15480804443359375, 0.16428756713867188, 0.17376708984375, 0.18324661254882812, 0.19272613525390625, 0.20220565795898438, 0.2116851806640625, 0.22116470336914062, 0.23064422607421875, 0.24012374877929688, 0.249603271484375, 0.2590827941894531, 0.26856231689453125, 0.2780418395996094, 0.2875213623046875, 0.2970008850097656, 0.30648040771484375, 0.3159599304199219, 0.325439453125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 1.0, 11.0, 8.0, 11.0, 5.0, 8.0, 10.0, 17.0, 21.0, 19.0, 17.0, 20.0, 17.0, 26.0, 29.0, 27.0, 29.0, 34.0, 36.0, 28.0, 35.0, 33.0, 41.0, 1066.0, 43.0, 35.0, 27.0, 34.0, 32.0, 31.0, 23.0, 24.0, 31.0, 21.0, 29.0, 31.0, 16.0, 21.0, 12.0, 9.0, 14.0, 14.0, 3.0, 11.0, 3.0, 8.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-2.3828125, -2.315155029296875, -2.24749755859375, -2.179840087890625, -2.1121826171875, -2.044525146484375, -1.97686767578125, -1.909210205078125, -1.841552734375, -1.773895263671875, -1.70623779296875, -1.638580322265625, -1.5709228515625, -1.503265380859375, -1.43560791015625, -1.367950439453125, -1.30029296875, -1.232635498046875, -1.16497802734375, -1.097320556640625, -1.0296630859375, -0.962005615234375, -0.89434814453125, -0.826690673828125, -0.759033203125, -0.691375732421875, -0.62371826171875, -0.556060791015625, -0.4884033203125, -0.420745849609375, -0.35308837890625, -0.285430908203125, -0.2177734375, -0.150115966796875, -0.08245849609375, -0.014801025390625, 0.0528564453125, 0.120513916015625, 0.18817138671875, 0.255828857421875, 0.323486328125, 0.391143798828125, 0.45880126953125, 0.526458740234375, 0.5941162109375, 0.661773681640625, 0.72943115234375, 0.797088623046875, 0.86474609375, 0.932403564453125, 1.00006103515625, 1.067718505859375, 1.1353759765625, 1.203033447265625, 1.27069091796875, 1.338348388671875, 1.406005859375, 1.473663330078125, 1.54132080078125, 1.608978271484375, 1.6766357421875, 1.744293212890625, 1.81195068359375, 1.879608154296875, 1.947265625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 3.0, 5.0, 4.0, 8.0, 30.0, 28.0, 45.0, 45.0, 100.0, 146.0, 170.0, 247.0, 386.0, 598.0, 913.0, 1267.0, 1938.0, 2749.0, 4379.0, 6705.0, 10038.0, 15671.0, 25212.0, 40795.0, 69921.0, 134893.0, 1405448.0, 167623.0, 81708.0, 47072.0, 28195.0, 17500.0, 11256.0, 7368.0, 4740.0, 3231.0, 2148.0, 1445.0, 966.0, 672.0, 435.0, 327.0, 212.0, 151.0, 111.0, 71.0, 37.0, 44.0, 22.0, 19.0, 16.0, 6.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.136474609375, -0.1318683624267578, -0.12726211547851562, -0.12265586853027344, -0.11804962158203125, -0.11344337463378906, -0.10883712768554688, -0.10423088073730469, -0.0996246337890625, -0.09501838684082031, -0.09041213989257812, -0.08580589294433594, -0.08119964599609375, -0.07659339904785156, -0.07198715209960938, -0.06738090515136719, -0.062774658203125, -0.05816841125488281, -0.053562164306640625, -0.04895591735839844, -0.04434967041015625, -0.03974342346191406, -0.035137176513671875, -0.030530929565429688, -0.0259246826171875, -0.021318435668945312, -0.016712188720703125, -0.012105941772460938, -0.00749969482421875, -0.0028934478759765625, 0.001712799072265625, 0.0063190460205078125, 0.01092529296875, 0.015531539916992188, 0.020137786865234375, 0.024744033813476562, 0.02935028076171875, 0.03395652770996094, 0.038562774658203125, 0.04316902160644531, 0.0477752685546875, 0.05238151550292969, 0.056987762451171875, 0.06159400939941406, 0.06620025634765625, 0.07080650329589844, 0.07541275024414062, 0.08001899719238281, 0.084625244140625, 0.08923149108886719, 0.09383773803710938, 0.09844398498535156, 0.10305023193359375, 0.10765647888183594, 0.11226272583007812, 0.11686897277832031, 0.1214752197265625, 0.1260814666748047, 0.13068771362304688, 0.13529396057128906, 0.13990020751953125, 0.14450645446777344, 0.14911270141601562, 0.1537189483642578, 0.1583251953125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 8.0, 14.0, 11.0, 13.0, 8.0, 23.0, 15.0, 18.0, 26.0, 37.0, 58.0, 72.0, 159.0, 133.0, 107.0, 82.0, 40.0, 38.0, 31.0, 13.0, 22.0, 15.0, 12.0, 5.0, 12.0, 2.0, 4.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3066997528076172e-05, -2.2328458726406097e-05, -2.1589919924736023e-05, -2.085138112306595e-05, -2.0112842321395874e-05, -1.93743035197258e-05, -1.8635764718055725e-05, -1.789722591638565e-05, -1.7158687114715576e-05, -1.6420148313045502e-05, -1.5681609511375427e-05, -1.4943070709705353e-05, -1.4204531908035278e-05, -1.3465993106365204e-05, -1.272745430469513e-05, -1.1988915503025055e-05, -1.125037670135498e-05, -1.0511837899684906e-05, -9.773299098014832e-06, -9.034760296344757e-06, -8.296221494674683e-06, -7.557682693004608e-06, -6.819143891334534e-06, -6.080605089664459e-06, -5.342066287994385e-06, -4.60352748632431e-06, -3.864988684654236e-06, -3.1264498829841614e-06, -2.387911081314087e-06, -1.6493722796440125e-06, -9.10833477973938e-07, -1.7229467630386353e-07, 5.662441253662109e-07, 1.3047829270362854e-06, 2.04332172870636e-06, 2.7818605303764343e-06, 3.520399332046509e-06, 4.258938133716583e-06, 4.997476935386658e-06, 5.736015737056732e-06, 6.474554538726807e-06, 7.213093340396881e-06, 7.951632142066956e-06, 8.69017094373703e-06, 9.428709745407104e-06, 1.0167248547077179e-05, 1.0905787348747253e-05, 1.1644326150417328e-05, 1.2382864952087402e-05, 1.3121403753757477e-05, 1.3859942555427551e-05, 1.4598481357097626e-05, 1.53370201587677e-05, 1.6075558960437775e-05, 1.681409776210785e-05, 1.7552636563777924e-05, 1.8291175365447998e-05, 1.9029714167118073e-05, 1.9768252968788147e-05, 2.050679177045822e-05, 2.1245330572128296e-05, 2.198386937379837e-05, 2.2722408175468445e-05, 2.346094697713852e-05, 2.4199485778808594e-05]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 16.0, 13.0, 18.0, 29.0, 31.0, 64.0, 93.0, 204.0, 893.0, 7601.0, 126039.0, 863153.0, 45895.0, 3507.0, 531.0, 162.0, 74.0, 47.0, 35.0, 26.0, 14.0, 14.0, 17.0, 11.0, 8.0, 3.0, 10.0, 6.0, 6.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00035643577575683594, -0.00034541264176368713, -0.00033438950777053833, -0.0003233663737773895, -0.0003123432397842407, -0.0003013201057910919, -0.0002902969717979431, -0.0002792738378047943, -0.0002682507038116455, -0.0002572275698184967, -0.0002462044358253479, -0.0002351813018321991, -0.0002241581678390503, -0.0002131350338459015, -0.00020211189985275269, -0.00019108876585960388, -0.00018006563186645508, -0.00016904249787330627, -0.00015801936388015747, -0.00014699622988700867, -0.00013597309589385986, -0.00012494996190071106, -0.00011392682790756226, -0.00010290369391441345, -9.188055992126465e-05, -8.085742592811584e-05, -6.983429193496704e-05, -5.881115794181824e-05, -4.7788023948669434e-05, -3.676488995552063e-05, -2.5741755962371826e-05, -1.4718621969223022e-05, -3.6954879760742188e-06, 7.327646017074585e-06, 1.835078001022339e-05, 2.9373914003372192e-05, 4.0397047996520996e-05, 5.14201819896698e-05, 6.24433159828186e-05, 7.346644997596741e-05, 8.448958396911621e-05, 9.551271796226501e-05, 0.00010653585195541382, 0.00011755898594856262, 0.00012858211994171143, 0.00013960525393486023, 0.00015062838792800903, 0.00016165152192115784, 0.00017267465591430664, 0.00018369778990745544, 0.00019472092390060425, 0.00020574405789375305, 0.00021676719188690186, 0.00022779032588005066, 0.00023881345987319946, 0.00024983659386634827, 0.00026085972785949707, 0.0002718828618526459, 0.0002829059958457947, 0.0002939291298389435, 0.0003049522638320923, 0.0003159753978252411, 0.0003269985318183899, 0.0003380216658115387, 0.0003490447998046875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 10.0, 26.0, 44.0, 148.0, 257.0, 276.0, 147.0, 64.0, 23.0, 12.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0825582396355458e-05, -1.910160790430382e-05, -1.737763341225218e-05, -1.565365892020054e-05, -1.3929683518654201e-05, -1.2205709026602563e-05, -1.0481733625056222e-05, -8.757759133004583e-06, -7.033784640952945e-06, -5.309810148901306e-06, -3.5858352021023165e-06, -1.861860255303327e-06, -1.3788576325168833e-07, 1.5860887287999503e-06, 3.3100641303462908e-06, 5.0340386223979294e-06, 6.758013114449568e-06, 8.481987606501207e-06, 1.0205962098552845e-05, 1.1929937500099186e-05, 1.3653911992150825e-05, 1.537788557470776e-05, 1.7101861885748804e-05, 1.8825836377800442e-05, 2.054981086985208e-05, 2.227378536190372e-05, 2.3997759853955358e-05, 2.57217361649964e-05, 2.7445708838058636e-05, 2.9169685149099678e-05, 3.089365782216191e-05, 3.2617634133202955e-05, 3.4341610444244e-05, 3.606558675528504e-05, 3.7789559428347275e-05, 3.951353573938832e-05, 4.123750841245055e-05, 4.2961484723491594e-05, 4.4685461034532636e-05, 4.640943370759487e-05, 4.813340638065711e-05, 4.985738269169815e-05, 5.1581355364760384e-05, 5.3305331675801426e-05, 5.502930434886366e-05, 5.6753280659904703e-05, 5.8477256970945746e-05, 6.020122964400798e-05, 6.192520959302783e-05, 6.364918226609007e-05, 6.537316221510991e-05, 6.709713488817215e-05, 6.882110756123438e-05, 7.054508023429662e-05, 7.226906018331647e-05, 7.39930328563787e-05, 7.571700552944094e-05, 7.744097820250317e-05, 7.916495815152302e-05, 8.088893082458526e-05, 8.26129034976475e-05, 8.433687617070973e-05, 8.606085611972958e-05, 8.778482879279181e-05, 8.950880146585405e-05]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 3.0, 5.0, 6.0, 8.0, 11.0, 11.0, 11.0, 16.0, 17.0, 16.0, 16.0, 18.0, 31.0, 33.0, 38.0, 35.0, 34.0, 41.0, 38.0, 58.0, 40.0, 48.0, 37.0, 40.0, 31.0, 35.0, 46.0, 37.0, 31.0, 41.0, 22.0, 29.0, 22.0, 25.0, 10.0, 7.0, 12.0, 8.0, 9.0, 8.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.1444091796875e-05, -1.1137686669826508e-05, -1.0831281542778015e-05, -1.0524876415729523e-05, -1.021847128868103e-05, -9.912066161632538e-06, -9.605661034584045e-06, -9.299255907535553e-06, -8.99285078048706e-06, -8.686445653438568e-06, -8.380040526390076e-06, -8.073635399341583e-06, -7.76723027229309e-06, -7.460825145244598e-06, -7.154420018196106e-06, -6.8480148911476135e-06, -6.541609764099121e-06, -6.235204637050629e-06, -5.928799510002136e-06, -5.622394382953644e-06, -5.315989255905151e-06, -5.009584128856659e-06, -4.7031790018081665e-06, -4.396773874759674e-06, -4.090368747711182e-06, -3.783963620662689e-06, -3.4775584936141968e-06, -3.1711533665657043e-06, -2.864748239517212e-06, -2.5583431124687195e-06, -2.251937985420227e-06, -1.9455328583717346e-06, -1.6391277313232422e-06, -1.3327226042747498e-06, -1.0263174772262573e-06, -7.199123501777649e-07, -4.1350722312927246e-07, -1.0710209608078003e-07, 1.993030309677124e-07, 5.057081580162048e-07, 8.121132850646973e-07, 1.1185184121131897e-06, 1.4249235391616821e-06, 1.7313286662101746e-06, 2.037733793258667e-06, 2.3441389203071594e-06, 2.650544047355652e-06, 2.9569491744041443e-06, 3.2633543014526367e-06, 3.569759428501129e-06, 3.876164555549622e-06, 4.182569682598114e-06, 4.4889748096466064e-06, 4.795379936695099e-06, 5.101785063743591e-06, 5.408190190792084e-06, 5.714595317840576e-06, 6.021000444889069e-06, 6.327405571937561e-06, 6.6338106989860535e-06, 6.940215826034546e-06, 7.246620953083038e-06, 7.553026080131531e-06, 7.859431207180023e-06, 8.165836334228516e-06]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 7.0, 5.0, 9.0, 9.0, 18.0, 10.0, 29.0, 19.0, 33.0, 42.0, 41.0, 48.0, 43.0, 43.0, 44.0, 55.0, 45.0, 41.0, 52.0, 42.0, 44.0, 37.0, 45.0, 28.0, 31.0, 16.0, 29.0, 12.0, 26.0, 17.0, 12.0, 8.0, 8.0, 8.0, 13.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.283203125, -3.169342041015625, -3.05548095703125, -2.941619873046875, -2.8277587890625, -2.713897705078125, -2.60003662109375, -2.486175537109375, -2.372314453125, -2.258453369140625, -2.14459228515625, -2.030731201171875, -1.9168701171875, -1.803009033203125, -1.68914794921875, -1.575286865234375, -1.46142578125, -1.347564697265625, -1.23370361328125, -1.119842529296875, -1.0059814453125, -0.892120361328125, -0.77825927734375, -0.664398193359375, -0.550537109375, -0.436676025390625, -0.32281494140625, -0.208953857421875, -0.0950927734375, 0.018768310546875, 0.13262939453125, 0.246490478515625, 0.3603515625, 0.474212646484375, 0.58807373046875, 0.701934814453125, 0.8157958984375, 0.929656982421875, 1.04351806640625, 1.157379150390625, 1.271240234375, 1.385101318359375, 1.49896240234375, 1.612823486328125, 1.7266845703125, 1.840545654296875, 1.95440673828125, 2.068267822265625, 2.18212890625, 2.295989990234375, 2.40985107421875, 2.523712158203125, 2.6375732421875, 2.751434326171875, 2.86529541015625, 2.979156494140625, 3.093017578125, 3.206878662109375, 3.32073974609375, 3.434600830078125, 3.5484619140625, 3.662322998046875, 3.77618408203125, 3.890045166015625, 4.00390625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 8.0, 11.0, 19.0, 34.0, 56.0, 86.0, 135.0, 203.0, 337.0, 575.0, 853.0, 1403.0, 2204.0, 4082.0, 7538.0, 15518.0, 34000.0, 80762.0, 229331.0, 419303.0, 146521.0, 55641.0, 24389.0, 11672.0, 5734.0, 3227.0, 1861.0, 1129.0, 715.0, 445.0, 295.0, 154.0, 115.0, 75.0, 44.0, 32.0, 17.0, 11.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.25390625, -4.1221923828125, -3.990478515625, -3.8587646484375, -3.72705078125, -3.5953369140625, -3.463623046875, -3.3319091796875, -3.2001953125, -3.0684814453125, -2.936767578125, -2.8050537109375, -2.67333984375, -2.5416259765625, -2.409912109375, -2.2781982421875, -2.146484375, -2.0147705078125, -1.883056640625, -1.7513427734375, -1.61962890625, -1.4879150390625, -1.356201171875, -1.2244873046875, -1.0927734375, -0.9610595703125, -0.829345703125, -0.6976318359375, -0.56591796875, -0.4342041015625, -0.302490234375, -0.1707763671875, -0.0390625, 0.0926513671875, 0.224365234375, 0.3560791015625, 0.48779296875, 0.6195068359375, 0.751220703125, 0.8829345703125, 1.0146484375, 1.1463623046875, 1.278076171875, 1.4097900390625, 1.54150390625, 1.6732177734375, 1.804931640625, 1.9366455078125, 2.068359375, 2.2000732421875, 2.331787109375, 2.4635009765625, 2.59521484375, 2.7269287109375, 2.858642578125, 2.9903564453125, 3.1220703125, 3.2537841796875, 3.385498046875, 3.5172119140625, 3.64892578125, 3.7806396484375, 3.912353515625, 4.0440673828125, 4.17578125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 9.0, 12.0, 6.0, 18.0, 14.0, 24.0, 22.0, 26.0, 34.0, 31.0, 38.0, 38.0, 50.0, 81.0, 144.0, 395.0, 1504.0, 139.0, 82.0, 65.0, 47.0, 38.0, 29.0, 35.0, 26.0, 29.0, 17.0, 15.0, 11.0, 9.0, 13.0, 8.0, 6.0, 9.0, 7.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.8984375, -11.5152587890625, -11.132080078125, -10.7489013671875, -10.36572265625, -9.9825439453125, -9.599365234375, -9.2161865234375, -8.8330078125, -8.4498291015625, -8.066650390625, -7.6834716796875, -7.30029296875, -6.9171142578125, -6.533935546875, -6.1507568359375, -5.767578125, -5.3843994140625, -5.001220703125, -4.6180419921875, -4.23486328125, -3.8516845703125, -3.468505859375, -3.0853271484375, -2.7021484375, -2.3189697265625, -1.935791015625, -1.5526123046875, -1.16943359375, -0.7862548828125, -0.403076171875, -0.0198974609375, 0.36328125, 0.7464599609375, 1.129638671875, 1.5128173828125, 1.89599609375, 2.2791748046875, 2.662353515625, 3.0455322265625, 3.4287109375, 3.8118896484375, 4.195068359375, 4.5782470703125, 4.96142578125, 5.3446044921875, 5.727783203125, 6.1109619140625, 6.494140625, 6.8773193359375, 7.260498046875, 7.6436767578125, 8.02685546875, 8.4100341796875, 8.793212890625, 9.1763916015625, 9.5595703125, 9.9427490234375, 10.325927734375, 10.7091064453125, 11.09228515625, 11.4754638671875, 11.858642578125, 12.2418212890625, 12.625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 6.0, 7.0, 11.0, 12.0, 19.0, 26.0, 23.0, 43.0, 54.0, 74.0, 114.0, 154.0, 203.0, 365.0, 1110.0, 7116.0, 257622.0, 2849347.0, 25400.0, 2560.0, 526.0, 255.0, 163.0, 125.0, 102.0, 77.0, 49.0, 39.0, 25.0, 20.0, 16.0, 10.0, 9.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.453125, -23.717529296875, -22.98193359375, -22.246337890625, -21.5107421875, -20.775146484375, -20.03955078125, -19.303955078125, -18.568359375, -17.832763671875, -17.09716796875, -16.361572265625, -15.6259765625, -14.890380859375, -14.15478515625, -13.419189453125, -12.68359375, -11.947998046875, -11.21240234375, -10.476806640625, -9.7412109375, -9.005615234375, -8.27001953125, -7.534423828125, -6.798828125, -6.063232421875, -5.32763671875, -4.592041015625, -3.8564453125, -3.120849609375, -2.38525390625, -1.649658203125, -0.9140625, -0.178466796875, 0.55712890625, 1.292724609375, 2.0283203125, 2.763916015625, 3.49951171875, 4.235107421875, 4.970703125, 5.706298828125, 6.44189453125, 7.177490234375, 7.9130859375, 8.648681640625, 9.38427734375, 10.119873046875, 10.85546875, 11.591064453125, 12.32666015625, 13.062255859375, 13.7978515625, 14.533447265625, 15.26904296875, 16.004638671875, 16.740234375, 17.475830078125, 18.21142578125, 18.947021484375, 19.6826171875, 20.418212890625, 21.15380859375, 21.889404296875, 22.625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 9.0, 38.0, 99.0, 172.0, 218.0, 208.0, 149.0, 68.0, 35.0, 8.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.45821762084961, -17.219425201416016, -15.980631828308105, -14.741838455200195, -13.503046035766602, -12.264253616333008, -11.025460243225098, -9.786666870117188, -8.547874450683594, -7.309081554412842, -6.07028865814209, -4.831495761871338, -3.592702865600586, -2.353909969329834, -1.115117073059082, 0.12367630004882812, 1.3624687194824219, 2.601261615753174, 3.840054512023926, 5.078847408294678, 6.31764030456543, 7.556433200836182, 8.795226097106934, 10.034019470214844, 11.272811889648438, 12.511604309082031, 13.750397682189941, 14.989191055297852, 16.227983474731445, 17.46677589416504, 18.705570220947266, 19.94436264038086, 21.18315887451172, 22.421951293945312, 23.660743713378906, 24.899538040161133, 26.138330459594727, 27.37712287902832, 28.615917205810547, 29.85470962524414, 31.093502044677734, 32.33229446411133, 33.57108688354492, 34.809879302978516, 36.048675537109375, 37.28746795654297, 38.52626037597656, 39.765052795410156, 41.00384521484375, 42.242637634277344, 43.48143005371094, 44.72022247314453, 45.959014892578125, 47.197811126708984, 48.43660354614258, 49.67539596557617, 50.914188385009766, 52.15298080444336, 53.39177322387695, 54.63056564331055, 55.869361877441406, 57.108154296875, 58.346946716308594, 59.58573913574219, 60.82453155517578]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 7.0, 2.0, 19.0, 12.0, 13.0, 7.0, 17.0, 29.0, 16.0, 24.0, 25.0, 37.0, 33.0, 30.0, 39.0, 38.0, 39.0, 44.0, 36.0, 39.0, 40.0, 41.0, 51.0, 47.0, 33.0, 38.0, 28.0, 35.0, 23.0, 25.0, 27.0, 12.0, 17.0, 14.0, 15.0, 10.0, 12.0, 9.0, 2.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.07946014404297, -29.098413467407227, -28.117366790771484, -27.13631820678711, -26.155271530151367, -25.174224853515625, -24.193178176879883, -23.21213150024414, -22.2310848236084, -21.250038146972656, -20.268991470336914, -19.287944793701172, -18.306896209716797, -17.325849533081055, -16.344802856445312, -15.36375617980957, -14.382708549499512, -13.40166187286377, -12.420614242553711, -11.439567565917969, -10.458520889282227, -9.477474212646484, -8.496426582336426, -7.515379905700684, -6.534332752227783, -5.553285598754883, -4.572238922119141, -3.5911917686462402, -2.610144853591919, -1.6290979385375977, -0.6480507850646973, 0.3329958915710449, 1.3140430450439453, 2.2950899600982666, 3.276136875152588, 4.257184028625488, 5.2382307052612305, 6.219277858734131, 7.200325012207031, 8.181371688842773, 9.162418365478516, 10.143465042114258, 11.124512672424316, 12.105559349060059, 13.0866060256958, 14.06765365600586, 15.048700332641602, 16.029747009277344, 17.01079559326172, 17.99184226989746, 18.972888946533203, 19.953937530517578, 20.93498420715332, 21.916030883789062, 22.897077560424805, 23.878124237060547, 24.85917091369629, 25.84021759033203, 26.821264266967773, 27.802310943603516, 28.78335952758789, 29.764406204223633, 30.745452880859375, 31.726499557495117, 32.70754623413086]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 12.0, 5.0, 5.0, 9.0, 6.0, 16.0, 14.0, 28.0, 18.0, 26.0, 35.0, 47.0, 44.0, 46.0, 46.0, 49.0, 34.0, 46.0, 59.0, 45.0, 45.0, 42.0, 44.0, 35.0, 29.0, 30.0, 28.0, 21.0, 20.0, 18.0, 18.0, 20.0, 12.0, 9.0, 3.0, 8.0, 5.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.51171875, -3.395416259765625, -3.27911376953125, -3.162811279296875, -3.0465087890625, -2.930206298828125, -2.81390380859375, -2.697601318359375, -2.581298828125, -2.464996337890625, -2.34869384765625, -2.232391357421875, -2.1160888671875, -1.999786376953125, -1.88348388671875, -1.767181396484375, -1.65087890625, -1.534576416015625, -1.41827392578125, -1.301971435546875, -1.1856689453125, -1.069366455078125, -0.95306396484375, -0.836761474609375, -0.720458984375, -0.604156494140625, -0.48785400390625, -0.371551513671875, -0.2552490234375, -0.138946533203125, -0.02264404296875, 0.093658447265625, 0.2099609375, 0.326263427734375, 0.44256591796875, 0.558868408203125, 0.6751708984375, 0.791473388671875, 0.90777587890625, 1.024078369140625, 1.140380859375, 1.256683349609375, 1.37298583984375, 1.489288330078125, 1.6055908203125, 1.721893310546875, 1.83819580078125, 1.954498291015625, 2.07080078125, 2.187103271484375, 2.30340576171875, 2.419708251953125, 2.5360107421875, 2.652313232421875, 2.76861572265625, 2.884918212890625, 3.001220703125, 3.117523193359375, 3.23382568359375, 3.350128173828125, 3.4664306640625, 3.582733154296875, 3.69903564453125, 3.815338134765625, 3.931640625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 10.0, 13.0, 17.0, 29.0, 28.0, 53.0, 73.0, 123.0, 209.0, 333.0, 613.0, 1080.0, 2110.0, 4203.0, 9131.0, 21591.0, 60479.0, 213515.0, 969904.0, 2083793.0, 609669.0, 142354.0, 43852.0, 16615.0, 7203.0, 3387.0, 1735.0, 889.0, 535.0, 278.0, 156.0, 92.0, 65.0, 48.0, 30.0, 28.0, 14.0, 9.0, 9.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.01171875, -4.821533203125, -4.63134765625, -4.441162109375, -4.2509765625, -4.060791015625, -3.87060546875, -3.680419921875, -3.490234375, -3.300048828125, -3.10986328125, -2.919677734375, -2.7294921875, -2.539306640625, -2.34912109375, -2.158935546875, -1.96875, -1.778564453125, -1.58837890625, -1.398193359375, -1.2080078125, -1.017822265625, -0.82763671875, -0.637451171875, -0.447265625, -0.257080078125, -0.06689453125, 0.123291015625, 0.3134765625, 0.503662109375, 0.69384765625, 0.884033203125, 1.07421875, 1.264404296875, 1.45458984375, 1.644775390625, 1.8349609375, 2.025146484375, 2.21533203125, 2.405517578125, 2.595703125, 2.785888671875, 2.97607421875, 3.166259765625, 3.3564453125, 3.546630859375, 3.73681640625, 3.927001953125, 4.1171875, 4.307373046875, 4.49755859375, 4.687744140625, 4.8779296875, 5.068115234375, 5.25830078125, 5.448486328125, 5.638671875, 5.828857421875, 6.01904296875, 6.209228515625, 6.3994140625, 6.589599609375, 6.77978515625, 6.969970703125, 7.16015625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 15.0, 12.0, 18.0, 24.0, 30.0, 38.0, 60.0, 107.0, 122.0, 163.0, 229.0, 342.0, 488.0, 556.0, 495.0, 374.0, 299.0, 192.0, 138.0, 98.0, 67.0, 50.0, 35.0, 29.0, 16.0, 15.0, 11.0, 12.0, 10.0, 4.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.05859375, -6.82049560546875, -6.5823974609375, -6.34429931640625, -6.106201171875, -5.86810302734375, -5.6300048828125, -5.39190673828125, -5.15380859375, -4.91571044921875, -4.6776123046875, -4.43951416015625, -4.201416015625, -3.96331787109375, -3.7252197265625, -3.48712158203125, -3.2490234375, -3.01092529296875, -2.7728271484375, -2.53472900390625, -2.296630859375, -2.05853271484375, -1.8204345703125, -1.58233642578125, -1.34423828125, -1.10614013671875, -0.8680419921875, -0.62994384765625, -0.391845703125, -0.15374755859375, 0.0843505859375, 0.32244873046875, 0.560546875, 0.79864501953125, 1.0367431640625, 1.27484130859375, 1.512939453125, 1.75103759765625, 1.9891357421875, 2.22723388671875, 2.46533203125, 2.70343017578125, 2.9415283203125, 3.17962646484375, 3.417724609375, 3.65582275390625, 3.8939208984375, 4.13201904296875, 4.3701171875, 4.60821533203125, 4.8463134765625, 5.08441162109375, 5.322509765625, 5.56060791015625, 5.7987060546875, 6.03680419921875, 6.27490234375, 6.51300048828125, 6.7510986328125, 6.98919677734375, 7.227294921875, 7.46539306640625, 7.7034912109375, 7.94158935546875, 8.1796875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 7.0, 15.0, 12.0, 26.0, 19.0, 43.0, 49.0, 79.0, 108.0, 150.0, 266.0, 494.0, 1604.0, 9780.0, 145883.0, 3365071.0, 638796.0, 27133.0, 3111.0, 718.0, 302.0, 181.0, 128.0, 103.0, 54.0, 42.0, 30.0, 20.0, 14.0, 10.0, 7.0, 10.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.734375, -23.0087890625, -22.283203125, -21.5576171875, -20.83203125, -20.1064453125, -19.380859375, -18.6552734375, -17.9296875, -17.2041015625, -16.478515625, -15.7529296875, -15.02734375, -14.3017578125, -13.576171875, -12.8505859375, -12.125, -11.3994140625, -10.673828125, -9.9482421875, -9.22265625, -8.4970703125, -7.771484375, -7.0458984375, -6.3203125, -5.5947265625, -4.869140625, -4.1435546875, -3.41796875, -2.6923828125, -1.966796875, -1.2412109375, -0.515625, 0.2099609375, 0.935546875, 1.6611328125, 2.38671875, 3.1123046875, 3.837890625, 4.5634765625, 5.2890625, 6.0146484375, 6.740234375, 7.4658203125, 8.19140625, 8.9169921875, 9.642578125, 10.3681640625, 11.09375, 11.8193359375, 12.544921875, 13.2705078125, 13.99609375, 14.7216796875, 15.447265625, 16.1728515625, 16.8984375, 17.6240234375, 18.349609375, 19.0751953125, 19.80078125, 20.5263671875, 21.251953125, 21.9775390625, 22.703125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 12.0, 18.0, 32.0, 48.0, 43.0, 82.0, 81.0, 96.0, 133.0, 99.0, 91.0, 83.0, 71.0, 47.0, 30.0, 15.0, 11.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.932220458984375, -42.64853286743164, -41.364845275878906, -40.08115768432617, -38.79747009277344, -37.5137825012207, -36.23009490966797, -34.946407318115234, -33.6627197265625, -32.379032135009766, -31.09534454345703, -29.811656951904297, -28.527969360351562, -27.244281768798828, -25.960594177246094, -24.67690658569336, -23.393220901489258, -22.109533309936523, -20.82584571838379, -19.542158126831055, -18.25847053527832, -16.974782943725586, -15.691096305847168, -14.407408714294434, -13.1237211227417, -11.840033531188965, -10.55634593963623, -9.272659301757812, -7.98897123336792, -6.7052836418151855, -5.421596527099609, -4.137908935546875, -2.8542213439941406, -1.5705338716506958, -0.286846399307251, 0.9968409538269043, 2.2805285453796387, 3.564216136932373, 4.847903251647949, 6.131590843200684, 7.415278434753418, 8.698966026306152, 9.982653617858887, 11.266340255737305, 12.550027847290039, 13.833715438842773, 15.117403030395508, 16.401090621948242, 17.684778213500977, 18.96846580505371, 20.252153396606445, 21.53584098815918, 22.819528579711914, 24.10321617126465, 25.38690185546875, 26.670589447021484, 27.95427703857422, 29.237964630126953, 30.521652221679688, 31.805339813232422, 33.089027404785156, 34.37271499633789, 35.656402587890625, 36.94009017944336, 38.223777770996094]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 5.0, 4.0, 6.0, 4.0, 3.0, 22.0, 17.0, 9.0, 27.0, 26.0, 27.0, 28.0, 29.0, 35.0, 28.0, 41.0, 36.0, 45.0, 43.0, 36.0, 44.0, 47.0, 45.0, 38.0, 35.0, 31.0, 35.0, 30.0, 25.0, 28.0, 25.0, 19.0, 21.0, 20.0, 11.0, 10.0, 11.0, 14.0, 8.0, 6.0, 5.0, 7.0, 8.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.45409393310547, -20.752635955810547, -20.051176071166992, -19.34971809387207, -18.64826011657715, -17.946800231933594, -17.245342254638672, -16.54388427734375, -15.842425346374512, -15.140966415405273, -14.439508438110352, -13.738049507141113, -13.036590576171875, -12.335132598876953, -11.633673667907715, -10.932214736938477, -10.230756759643555, -9.529297828674316, -8.827839851379395, -8.126380920410156, -7.424922466278076, -6.723464012145996, -6.022005081176758, -5.320546627044678, -4.619088172912598, -3.9176297187805176, -3.2161710262298584, -2.514712333679199, -1.8132538795471191, -1.111795425415039, -0.4103364944458008, 0.2911219596862793, 0.9925823211669922, 1.6940408945083618, 2.3954994678497314, 3.0969581604003906, 3.7984166145324707, 4.499875068664551, 5.201333999633789, 5.902792453765869, 6.604250907897949, 7.305709362030029, 8.00716781616211, 8.708626747131348, 9.410085678100586, 10.111543655395508, 10.813002586364746, 11.514461517333984, 12.215919494628906, 12.917378425598145, 13.618836402893066, 14.320295333862305, 15.021753311157227, 15.723212242126465, 16.424671173095703, 17.126129150390625, 17.827587127685547, 18.52904510498047, 19.230504989624023, 19.931962966918945, 20.633420944213867, 21.334880828857422, 22.036338806152344, 22.737796783447266, 23.43925666809082]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 10.0, 5.0, 5.0, 10.0, 7.0, 11.0, 19.0, 9.0, 21.0, 28.0, 32.0, 25.0, 42.0, 51.0, 38.0, 50.0, 56.0, 45.0, 35.0, 58.0, 52.0, 45.0, 30.0, 37.0, 38.0, 33.0, 27.0, 25.0, 26.0, 21.0, 18.0, 12.0, 10.0, 15.0, 11.0, 8.0, 7.0, 5.0, 3.0, 1.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21875, -3.10369873046875, -2.9886474609375, -2.87359619140625, -2.758544921875, -2.64349365234375, -2.5284423828125, -2.41339111328125, -2.29833984375, -2.18328857421875, -2.0682373046875, -1.95318603515625, -1.838134765625, -1.72308349609375, -1.6080322265625, -1.49298095703125, -1.3779296875, -1.26287841796875, -1.1478271484375, -1.03277587890625, -0.917724609375, -0.80267333984375, -0.6876220703125, -0.57257080078125, -0.45751953125, -0.34246826171875, -0.2274169921875, -0.11236572265625, 0.002685546875, 0.11773681640625, 0.2327880859375, 0.34783935546875, 0.462890625, 0.57794189453125, 0.6929931640625, 0.80804443359375, 0.923095703125, 1.03814697265625, 1.1531982421875, 1.26824951171875, 1.38330078125, 1.49835205078125, 1.6134033203125, 1.72845458984375, 1.843505859375, 1.95855712890625, 2.0736083984375, 2.18865966796875, 2.3037109375, 2.41876220703125, 2.5338134765625, 2.64886474609375, 2.763916015625, 2.87896728515625, 2.9940185546875, 3.10906982421875, 3.22412109375, 3.33917236328125, 3.4542236328125, 3.56927490234375, 3.684326171875, 3.79937744140625, 3.9144287109375, 4.02947998046875, 4.14453125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 7.0, 7.0, 12.0, 18.0, 34.0, 36.0, 56.0, 71.0, 112.0, 154.0, 206.0, 303.0, 457.0, 671.0, 929.0, 1360.0, 2032.0, 3036.0, 4550.0, 6942.0, 10849.0, 17657.0, 29611.0, 52136.0, 99890.0, 266745.0, 307780.0, 105928.0, 54524.0, 31044.0, 18322.0, 11399.0, 7296.0, 4674.0, 3079.0, 2040.0, 1455.0, 982.0, 649.0, 462.0, 322.0, 234.0, 159.0, 112.0, 71.0, 38.0, 46.0, 20.0, 17.0, 9.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.306884765625, -0.2975959777832031, -0.28830718994140625, -0.2790184020996094, -0.2697296142578125, -0.2604408264160156, -0.25115203857421875, -0.24186325073242188, -0.232574462890625, -0.22328567504882812, -0.21399688720703125, -0.20470809936523438, -0.1954193115234375, -0.18613052368164062, -0.17684173583984375, -0.16755294799804688, -0.15826416015625, -0.14897537231445312, -0.13968658447265625, -0.13039779663085938, -0.1211090087890625, -0.11182022094726562, -0.10253143310546875, -0.09324264526367188, -0.083953857421875, -0.07466506958007812, -0.06537628173828125, -0.056087493896484375, -0.0467987060546875, -0.037509918212890625, -0.02822113037109375, -0.018932342529296875, -0.0096435546875, -0.000354766845703125, 0.00893402099609375, 0.018222808837890625, 0.0275115966796875, 0.036800384521484375, 0.04608917236328125, 0.055377960205078125, 0.064666748046875, 0.07395553588867188, 0.08324432373046875, 0.09253311157226562, 0.1018218994140625, 0.11111068725585938, 0.12039947509765625, 0.12968826293945312, 0.13897705078125, 0.14826583862304688, 0.15755462646484375, 0.16684341430664062, 0.1761322021484375, 0.18542098999023438, 0.19470977783203125, 0.20399856567382812, 0.213287353515625, 0.22257614135742188, 0.23186492919921875, 0.24115371704101562, 0.2504425048828125, 0.2597312927246094, 0.26902008056640625, 0.2783088684082031, 0.28759765625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 7.0, 9.0, 7.0, 11.0, 13.0, 17.0, 19.0, 17.0, 18.0, 14.0, 22.0, 23.0, 21.0, 36.0, 35.0, 31.0, 24.0, 34.0, 31.0, 38.0, 43.0, 1067.0, 49.0, 38.0, 34.0, 30.0, 20.0, 27.0, 24.0, 27.0, 22.0, 27.0, 21.0, 19.0, 15.0, 17.0, 21.0, 15.0, 15.0, 12.0, 9.0, 8.0, 3.0, 4.0, 3.0, 7.0, 2.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.8837890625, -1.8196868896484375, -1.755584716796875, -1.6914825439453125, -1.62738037109375, -1.5632781982421875, -1.499176025390625, -1.4350738525390625, -1.3709716796875, -1.3068695068359375, -1.242767333984375, -1.1786651611328125, -1.11456298828125, -1.0504608154296875, -0.986358642578125, -0.9222564697265625, -0.858154296875, -0.7940521240234375, -0.729949951171875, -0.6658477783203125, -0.60174560546875, -0.5376434326171875, -0.473541259765625, -0.4094390869140625, -0.3453369140625, -0.2812347412109375, -0.217132568359375, -0.1530303955078125, -0.08892822265625, -0.0248260498046875, 0.039276123046875, 0.1033782958984375, 0.16748046875, 0.2315826416015625, 0.295684814453125, 0.3597869873046875, 0.42388916015625, 0.4879913330078125, 0.552093505859375, 0.6161956787109375, 0.6802978515625, 0.7444000244140625, 0.808502197265625, 0.8726043701171875, 0.93670654296875, 1.0008087158203125, 1.064910888671875, 1.1290130615234375, 1.193115234375, 1.2572174072265625, 1.321319580078125, 1.3854217529296875, 1.44952392578125, 1.5136260986328125, 1.577728271484375, 1.6418304443359375, 1.7059326171875, 1.7700347900390625, 1.834136962890625, 1.8982391357421875, 1.96234130859375, 2.0264434814453125, 2.090545654296875, 2.1546478271484375, 2.21875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 9.0, 8.0, 19.0, 26.0, 35.0, 46.0, 61.0, 91.0, 139.0, 196.0, 283.0, 393.0, 538.0, 868.0, 1163.0, 1716.0, 2413.0, 3654.0, 5446.0, 7897.0, 11971.0, 18434.0, 28709.0, 46322.0, 79884.0, 165359.0, 1407324.0, 129929.0, 68369.0, 40964.0, 25224.0, 16487.0, 10621.0, 7168.0, 4898.0, 3314.0, 2206.0, 1469.0, 1062.0, 756.0, 534.0, 326.0, 260.0, 174.0, 113.0, 69.0, 57.0, 45.0, 35.0, 18.0, 9.0, 7.0, 5.0, 7.0, 5.0, 3.0], "bins": [-0.1480712890625, -0.14376258850097656, -0.13945388793945312, -0.1351451873779297, -0.13083648681640625, -0.1265277862548828, -0.12221908569335938, -0.11791038513183594, -0.1136016845703125, -0.10929298400878906, -0.10498428344726562, -0.10067558288574219, -0.09636688232421875, -0.09205818176269531, -0.08774948120117188, -0.08344078063964844, -0.079132080078125, -0.07482337951660156, -0.07051467895507812, -0.06620597839355469, -0.06189727783203125, -0.05758857727050781, -0.053279876708984375, -0.04897117614746094, -0.0446624755859375, -0.04035377502441406, -0.036045074462890625, -0.03173637390136719, -0.02742767333984375, -0.023118972778320312, -0.018810272216796875, -0.014501571655273438, -0.01019287109375, -0.0058841705322265625, -0.001575469970703125, 0.0027332305908203125, 0.00704193115234375, 0.011350631713867188, 0.015659332275390625, 0.019968032836914062, 0.0242767333984375, 0.028585433959960938, 0.032894134521484375, 0.03720283508300781, 0.04151153564453125, 0.04582023620605469, 0.050128936767578125, 0.05443763732910156, 0.058746337890625, 0.06305503845214844, 0.06736373901367188, 0.07167243957519531, 0.07598114013671875, 0.08028984069824219, 0.08459854125976562, 0.08890724182128906, 0.0932159423828125, 0.09752464294433594, 0.10183334350585938, 0.10614204406738281, 0.11045074462890625, 0.11475944519042969, 0.11906814575195312, 0.12337684631347656, 0.127685546875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 6.0, 4.0, 4.0, 13.0, 7.0, 17.0, 23.0, 32.0, 40.0, 53.0, 65.0, 109.0, 149.0, 139.0, 92.0, 71.0, 46.0, 32.0, 26.0, 12.0, 13.0, 9.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.562999725341797e-05, -2.4932436645030975e-05, -2.4234876036643982e-05, -2.353731542825699e-05, -2.2839754819869995e-05, -2.2142194211483002e-05, -2.1444633603096008e-05, -2.0747072994709015e-05, -2.004951238632202e-05, -1.9351951777935028e-05, -1.8654391169548035e-05, -1.795683056116104e-05, -1.7259269952774048e-05, -1.6561709344387054e-05, -1.586414873600006e-05, -1.5166588127613068e-05, -1.4469027519226074e-05, -1.377146691083908e-05, -1.3073906302452087e-05, -1.2376345694065094e-05, -1.16787850856781e-05, -1.0981224477291107e-05, -1.0283663868904114e-05, -9.58610326051712e-06, -8.888542652130127e-06, -8.190982043743134e-06, -7.49342143535614e-06, -6.795860826969147e-06, -6.098300218582153e-06, -5.40073961019516e-06, -4.7031790018081665e-06, -4.005618393421173e-06, -3.3080577850341797e-06, -2.6104971766471863e-06, -1.912936568260193e-06, -1.2153759598731995e-06, -5.178153514862061e-07, 1.7974525690078735e-07, 8.773058652877808e-07, 1.5748664736747742e-06, 2.2724270820617676e-06, 2.969987690448761e-06, 3.6675482988357544e-06, 4.365108907222748e-06, 5.062669515609741e-06, 5.760230123996735e-06, 6.457790732383728e-06, 7.1553513407707214e-06, 7.852911949157715e-06, 8.550472557544708e-06, 9.248033165931702e-06, 9.945593774318695e-06, 1.0643154382705688e-05, 1.1340714991092682e-05, 1.2038275599479675e-05, 1.2735836207866669e-05, 1.3433396816253662e-05, 1.4130957424640656e-05, 1.4828518033027649e-05, 1.5526078641414642e-05, 1.6223639249801636e-05, 1.692119985818863e-05, 1.7618760466575623e-05, 1.8316321074962616e-05, 1.901388168334961e-05]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 9.0, 6.0, 11.0, 18.0, 14.0, 24.0, 39.0, 59.0, 136.0, 459.0, 4167.0, 121253.0, 897761.0, 22789.0, 1310.0, 203.0, 92.0, 51.0, 37.0, 28.0, 22.0, 11.0, 10.0, 3.0, 8.0, 7.0, 7.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032329559326171875, -0.00031144171953201294, -0.00029958784580230713, -0.0002877339720726013, -0.0002758800983428955, -0.0002640262246131897, -0.0002521723508834839, -0.00024031847715377808, -0.00022846460342407227, -0.00021661072969436646, -0.00020475685596466064, -0.00019290298223495483, -0.00018104910850524902, -0.0001691952347755432, -0.0001573413610458374, -0.0001454874873161316, -0.00013363361358642578, -0.00012177973985671997, -0.00010992586612701416, -9.807199239730835e-05, -8.621811866760254e-05, -7.436424493789673e-05, -6.251037120819092e-05, -5.065649747848511e-05, -3.88026237487793e-05, -2.6948750019073486e-05, -1.5094876289367676e-05, -3.2410025596618652e-06, 8.612871170043945e-06, 2.0466744899749756e-05, 3.2320618629455566e-05, 4.417449235916138e-05, 5.602836608886719e-05, 6.7882239818573e-05, 7.973611354827881e-05, 9.158998727798462e-05, 0.00010344386100769043, 0.00011529773473739624, 0.00012715160846710205, 0.00013900548219680786, 0.00015085935592651367, 0.00016271322965621948, 0.0001745671033859253, 0.0001864209771156311, 0.00019827485084533691, 0.00021012872457504272, 0.00022198259830474854, 0.00023383647203445435, 0.00024569034576416016, 0.00025754421949386597, 0.0002693980932235718, 0.0002812519669532776, 0.0002931058406829834, 0.0003049597144126892, 0.000316813588142395, 0.00032866746187210083, 0.00034052133560180664, 0.00035237520933151245, 0.00036422908306121826, 0.00037608295679092407, 0.0003879368305206299, 0.0003997907042503357, 0.0004116445779800415, 0.0004234984517097473, 0.0004353523254394531]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 14.0, 27.0, 46.0, 76.0, 111.0, 165.0, 195.0, 159.0, 89.0, 52.0, 31.0, 18.0, 8.0, 5.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.4344014895614237e-05, -4.3407755583757535e-05, -4.247149627190083e-05, -4.1535233322065324e-05, -4.059897401020862e-05, -3.966271469835192e-05, -3.872645538649522e-05, -3.7790196074638516e-05, -3.6853936762781814e-05, -3.591767745092511e-05, -3.498141813906841e-05, -3.404515882721171e-05, -3.31088958773762e-05, -3.21726365655195e-05, -3.1236377253662795e-05, -3.0300117941806093e-05, -2.9363854991970584e-05, -2.8427595680113882e-05, -2.7491334549267776e-05, -2.6555075237411074e-05, -2.5618815925554372e-05, -2.4682554794708267e-05, -2.3746295482851565e-05, -2.2810036170994863e-05, -2.187377685913816e-05, -2.093751754728146e-05, -2.0001256416435353e-05, -1.906499710457865e-05, -1.812873779272195e-05, -1.7192476661875844e-05, -1.6256217350019142e-05, -1.531995803816244e-05, -1.4383696907316335e-05, -1.344743668596493e-05, -1.2511177374108229e-05, -1.1574917152756825e-05, -1.0638656931405421e-05, -9.702396710054018e-06, -8.766137398197316e-06, -7.829877176845912e-06, -6.893617410241859e-06, -5.957357643637806e-06, -5.0210974222864024e-06, -4.08483765568235e-06, -3.1485776617046213e-06, -2.212317667726893e-06, -1.2760579011228401e-06, -3.397976797714364e-07, 5.964620868326165e-07, 1.5327220808103448e-06, 2.468982074788073e-06, 3.405241841392126e-06, 4.34150206274353e-06, 5.2777618293475825e-06, 6.214021595951635e-06, 7.150281817303039e-06, 8.086541129159741e-06, 9.022801350511145e-06, 9.959060662367847e-06, 1.089532088371925e-05, 1.1831581105070654e-05, 1.2767841326422058e-05, 1.370410063827876e-05, 1.4640360859630164e-05, 1.5576621080981568e-05]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 1.0, 8.0, 7.0, 10.0, 16.0, 22.0, 26.0, 17.0, 20.0, 11.0, 25.0, 22.0, 42.0, 32.0, 29.0, 33.0, 43.0, 22.0, 47.0, 49.0, 42.0, 46.0, 37.0, 36.0, 47.0, 39.0, 34.0, 33.0, 24.0, 20.0, 21.0, 18.0, 24.0, 24.0, 15.0, 10.0, 14.0, 11.0, 4.0, 7.0, 4.0, 6.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.285045623779297e-06, -8.036382496356964e-06, -7.787719368934631e-06, -7.539056241512299e-06, -7.290393114089966e-06, -7.041729986667633e-06, -6.7930668592453e-06, -6.5444037318229675e-06, -6.295740604400635e-06, -6.047077476978302e-06, -5.798414349555969e-06, -5.5497512221336365e-06, -5.301088094711304e-06, -5.052424967288971e-06, -4.803761839866638e-06, -4.555098712444305e-06, -4.306435585021973e-06, -4.05777245759964e-06, -3.809109330177307e-06, -3.5604462027549744e-06, -3.3117830753326416e-06, -3.063119947910309e-06, -2.814456820487976e-06, -2.5657936930656433e-06, -2.3171305656433105e-06, -2.0684674382209778e-06, -1.819804310798645e-06, -1.5711411833763123e-06, -1.3224780559539795e-06, -1.0738149285316467e-06, -8.25151801109314e-07, -5.764886736869812e-07, -3.2782554626464844e-07, -7.916241884231567e-08, 1.695007085800171e-07, 4.1816383600234985e-07, 6.668269634246826e-07, 9.154900908470154e-07, 1.1641532182693481e-06, 1.412816345691681e-06, 1.6614794731140137e-06, 1.9101426005363464e-06, 2.158805727958679e-06, 2.407468855381012e-06, 2.6561319828033447e-06, 2.9047951102256775e-06, 3.1534582376480103e-06, 3.402121365070343e-06, 3.6507844924926758e-06, 3.8994476199150085e-06, 4.148110747337341e-06, 4.396773874759674e-06, 4.645437002182007e-06, 4.89410012960434e-06, 5.142763257026672e-06, 5.391426384449005e-06, 5.640089511871338e-06, 5.888752639293671e-06, 6.137415766716003e-06, 6.386078894138336e-06, 6.634742021560669e-06, 6.883405148983002e-06, 7.1320682764053345e-06, 7.380731403827667e-06, 7.62939453125e-06]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 10.0, 5.0, 5.0, 10.0, 7.0, 11.0, 19.0, 9.0, 21.0, 28.0, 32.0, 25.0, 42.0, 51.0, 38.0, 50.0, 56.0, 45.0, 35.0, 58.0, 52.0, 45.0, 30.0, 37.0, 38.0, 33.0, 27.0, 25.0, 26.0, 21.0, 18.0, 12.0, 10.0, 15.0, 11.0, 8.0, 7.0, 5.0, 3.0, 1.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21875, -3.10369873046875, -2.9886474609375, -2.87359619140625, -2.758544921875, -2.64349365234375, -2.5284423828125, -2.41339111328125, -2.29833984375, -2.18328857421875, -2.0682373046875, -1.95318603515625, -1.838134765625, -1.72308349609375, -1.6080322265625, -1.49298095703125, -1.3779296875, -1.26287841796875, -1.1478271484375, -1.03277587890625, -0.917724609375, -0.80267333984375, -0.6876220703125, -0.57257080078125, -0.45751953125, -0.34246826171875, -0.2274169921875, -0.11236572265625, 0.002685546875, 0.11773681640625, 0.2327880859375, 0.34783935546875, 0.462890625, 0.57794189453125, 0.6929931640625, 0.80804443359375, 0.923095703125, 1.03814697265625, 1.1531982421875, 1.26824951171875, 1.38330078125, 1.49835205078125, 1.6134033203125, 1.72845458984375, 1.843505859375, 1.95855712890625, 2.0736083984375, 2.18865966796875, 2.3037109375, 2.41876220703125, 2.5338134765625, 2.64886474609375, 2.763916015625, 2.87896728515625, 2.9940185546875, 3.10906982421875, 3.22412109375, 3.33917236328125, 3.4542236328125, 3.56927490234375, 3.684326171875, 3.79937744140625, 3.9144287109375, 4.02947998046875, 4.14453125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 8.0, 8.0, 13.0, 16.0, 23.0, 34.0, 57.0, 82.0, 139.0, 208.0, 371.0, 558.0, 975.0, 1702.0, 2863.0, 5414.0, 10016.0, 20499.0, 44441.0, 104132.0, 300095.0, 347473.0, 115068.0, 47999.0, 22198.0, 10899.0, 5592.0, 3149.0, 1777.0, 1051.0, 608.0, 402.0, 243.0, 159.0, 90.0, 56.0, 45.0, 28.0, 16.0, 11.0, 10.0, 2.0, 7.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.818359375, -2.7178955078125, -2.617431640625, -2.5169677734375, -2.41650390625, -2.3160400390625, -2.215576171875, -2.1151123046875, -2.0146484375, -1.9141845703125, -1.813720703125, -1.7132568359375, -1.61279296875, -1.5123291015625, -1.411865234375, -1.3114013671875, -1.2109375, -1.1104736328125, -1.010009765625, -0.9095458984375, -0.80908203125, -0.7086181640625, -0.608154296875, -0.5076904296875, -0.4072265625, -0.3067626953125, -0.206298828125, -0.1058349609375, -0.00537109375, 0.0950927734375, 0.195556640625, 0.2960205078125, 0.396484375, 0.4969482421875, 0.597412109375, 0.6978759765625, 0.79833984375, 0.8988037109375, 0.999267578125, 1.0997314453125, 1.2001953125, 1.3006591796875, 1.401123046875, 1.5015869140625, 1.60205078125, 1.7025146484375, 1.802978515625, 1.9034423828125, 2.00390625, 2.1043701171875, 2.204833984375, 2.3052978515625, 2.40576171875, 2.5062255859375, 2.606689453125, 2.7071533203125, 2.8076171875, 2.9080810546875, 3.008544921875, 3.1090087890625, 3.20947265625, 3.3099365234375, 3.410400390625, 3.5108642578125, 3.611328125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 8.0, 8.0, 5.0, 12.0, 23.0, 19.0, 18.0, 29.0, 14.0, 24.0, 38.0, 38.0, 41.0, 52.0, 41.0, 101.0, 236.0, 1717.0, 148.0, 87.0, 62.0, 42.0, 40.0, 45.0, 29.0, 30.0, 25.0, 28.0, 12.0, 20.0, 14.0, 9.0, 14.0, 8.0, 3.0, 2.0, 0.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4453125, -13.0296630859375, -12.614013671875, -12.1983642578125, -11.78271484375, -11.3670654296875, -10.951416015625, -10.5357666015625, -10.1201171875, -9.7044677734375, -9.288818359375, -8.8731689453125, -8.45751953125, -8.0418701171875, -7.626220703125, -7.2105712890625, -6.794921875, -6.3792724609375, -5.963623046875, -5.5479736328125, -5.13232421875, -4.7166748046875, -4.301025390625, -3.8853759765625, -3.4697265625, -3.0540771484375, -2.638427734375, -2.2227783203125, -1.80712890625, -1.3914794921875, -0.975830078125, -0.5601806640625, -0.14453125, 0.2711181640625, 0.686767578125, 1.1024169921875, 1.51806640625, 1.9337158203125, 2.349365234375, 2.7650146484375, 3.1806640625, 3.5963134765625, 4.011962890625, 4.4276123046875, 4.84326171875, 5.2589111328125, 5.674560546875, 6.0902099609375, 6.505859375, 6.9215087890625, 7.337158203125, 7.7528076171875, 8.16845703125, 8.5841064453125, 8.999755859375, 9.4154052734375, 9.8310546875, 10.2467041015625, 10.662353515625, 11.0780029296875, 11.49365234375, 11.9093017578125, 12.324951171875, 12.7406005859375, 13.15625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 6.0, 8.0, 12.0, 16.0, 13.0, 24.0, 24.0, 37.0, 38.0, 61.0, 87.0, 127.0, 164.0, 241.0, 483.0, 1660.0, 36297.0, 3080996.0, 22703.0, 1445.0, 428.0, 230.0, 154.0, 115.0, 88.0, 51.0, 42.0, 42.0, 27.0, 26.0, 17.0, 10.0, 8.0, 10.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.765625, -24.946533203125, -24.12744140625, -23.308349609375, -22.4892578125, -21.670166015625, -20.85107421875, -20.031982421875, -19.212890625, -18.393798828125, -17.57470703125, -16.755615234375, -15.9365234375, -15.117431640625, -14.29833984375, -13.479248046875, -12.66015625, -11.841064453125, -11.02197265625, -10.202880859375, -9.3837890625, -8.564697265625, -7.74560546875, -6.926513671875, -6.107421875, -5.288330078125, -4.46923828125, -3.650146484375, -2.8310546875, -2.011962890625, -1.19287109375, -0.373779296875, 0.4453125, 1.264404296875, 2.08349609375, 2.902587890625, 3.7216796875, 4.540771484375, 5.35986328125, 6.178955078125, 6.998046875, 7.817138671875, 8.63623046875, 9.455322265625, 10.2744140625, 11.093505859375, 11.91259765625, 12.731689453125, 13.55078125, 14.369873046875, 15.18896484375, 16.008056640625, 16.8271484375, 17.646240234375, 18.46533203125, 19.284423828125, 20.103515625, 20.922607421875, 21.74169921875, 22.560791015625, 23.3798828125, 24.198974609375, 25.01806640625, 25.837158203125, 26.65625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 20.0, 59.0, 129.0, 280.0, 292.0, 152.0, 57.0, 21.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.707942962646484, -39.663387298583984, -38.61883544921875, -37.57427978515625, -36.52972412109375, -35.485172271728516, -34.440616607666016, -33.396060943603516, -32.35150909423828, -31.306955337524414, -30.262399673461914, -29.217845916748047, -28.17329216003418, -27.128738403320312, -26.084182739257812, -25.039628982543945, -23.995073318481445, -22.950519561767578, -21.905963897705078, -20.86141014099121, -19.816856384277344, -18.772300720214844, -17.727746963500977, -16.68319320678711, -15.638638496398926, -14.594083786010742, -13.549530029296875, -12.504975318908691, -11.460420608520508, -10.41586685180664, -9.371312141418457, -8.326757431030273, -7.282201766967773, -6.237647533416748, -5.193093299865723, -4.148538589477539, -3.1039843559265137, -2.0594301223754883, -1.0148754119873047, 0.029678821563720703, 1.074233055114746, 2.1187872886657715, 3.163341760635376, 4.2078962326049805, 5.252450466156006, 6.297004699707031, 7.341559410095215, 8.386114120483398, 9.430667877197266, 10.47522258758545, 11.519776344299316, 12.5643310546875, 13.608884811401367, 14.65343952178955, 15.697994232177734, 16.7425479888916, 17.78710174560547, 18.831655502319336, 19.876211166381836, 20.920764923095703, 21.96531867980957, 23.009872436523438, 24.054428100585938, 25.098981857299805, 26.143537521362305]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 5.0, 5.0, 4.0, 8.0, 3.0, 11.0, 12.0, 10.0, 12.0, 14.0, 21.0, 19.0, 26.0, 28.0, 25.0, 24.0, 33.0, 20.0, 30.0, 27.0, 42.0, 46.0, 37.0, 43.0, 34.0, 47.0, 40.0, 36.0, 38.0, 45.0, 27.0, 42.0, 23.0, 19.0, 23.0, 20.0, 22.0, 18.0, 8.0, 6.0, 19.0, 7.0, 9.0, 3.0, 7.0, 1.0, 5.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.219924926757812, -27.25336456298828, -26.28680419921875, -25.32024383544922, -24.353683471679688, -23.387123107910156, -22.420562744140625, -21.454002380371094, -20.487442016601562, -19.52088165283203, -18.5543212890625, -17.58776092529297, -16.621200561523438, -15.654640197753906, -14.688078880310059, -13.721518516540527, -12.75495719909668, -11.788396835327148, -10.821836471557617, -9.855276107788086, -8.888715744018555, -7.922154903411865, -6.955594062805176, -5.9890336990356445, -5.022473335266113, -4.055912971496582, -3.0893523693084717, -2.1227917671203613, -1.15623140335083, -0.18967103958129883, 0.7768898010253906, 1.7434501647949219, 2.710010528564453, 3.6765708923339844, 4.643131256103516, 5.609692096710205, 6.576252460479736, 7.542812824249268, 8.509373664855957, 9.475934028625488, 10.44249439239502, 11.40905475616455, 12.375615119934082, 13.34217643737793, 14.308736801147461, 15.275297164916992, 16.241857528686523, 17.208417892456055, 18.174978256225586, 19.141538619995117, 20.10809898376465, 21.07465934753418, 22.04121971130371, 23.007780075073242, 23.974342346191406, 24.940902709960938, 25.90746307373047, 26.8740234375, 27.84058380126953, 28.807144165039062, 29.773704528808594, 30.740264892578125, 31.706825256347656, 32.67338562011719, 33.63994598388672]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 8.0, 9.0, 4.0, 8.0, 8.0, 9.0, 13.0, 13.0, 11.0, 19.0, 35.0, 21.0, 32.0, 42.0, 44.0, 35.0, 49.0, 48.0, 50.0, 48.0, 49.0, 48.0, 48.0, 31.0, 33.0, 42.0, 32.0, 29.0, 30.0, 26.0, 21.0, 19.0, 13.0, 13.0, 12.0, 9.0, 8.0, 6.0, 7.0, 4.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.396484375, -3.280059814453125, -3.16363525390625, -3.047210693359375, -2.9307861328125, -2.814361572265625, -2.69793701171875, -2.581512451171875, -2.465087890625, -2.348663330078125, -2.23223876953125, -2.115814208984375, -1.9993896484375, -1.882965087890625, -1.76654052734375, -1.650115966796875, -1.53369140625, -1.417266845703125, -1.30084228515625, -1.184417724609375, -1.0679931640625, -0.951568603515625, -0.83514404296875, -0.718719482421875, -0.602294921875, -0.485870361328125, -0.36944580078125, -0.253021240234375, -0.1365966796875, -0.020172119140625, 0.09625244140625, 0.212677001953125, 0.3291015625, 0.445526123046875, 0.56195068359375, 0.678375244140625, 0.7947998046875, 0.911224365234375, 1.02764892578125, 1.144073486328125, 1.260498046875, 1.376922607421875, 1.49334716796875, 1.609771728515625, 1.7261962890625, 1.842620849609375, 1.95904541015625, 2.075469970703125, 2.19189453125, 2.308319091796875, 2.42474365234375, 2.541168212890625, 2.6575927734375, 2.774017333984375, 2.89044189453125, 3.006866455078125, 3.123291015625, 3.239715576171875, 3.35614013671875, 3.472564697265625, 3.5889892578125, 3.705413818359375, 3.82183837890625, 3.938262939453125, 4.0546875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 10.0, 11.0, 19.0, 39.0, 56.0, 82.0, 126.0, 196.0, 303.0, 487.0, 875.0, 1504.0, 2701.0, 5051.0, 10335.0, 22495.0, 55450.0, 161067.0, 576276.0, 1791157.0, 1116204.0, 294191.0, 91089.0, 34245.0, 14936.0, 7120.0, 3601.0, 1965.0, 1093.0, 618.0, 345.0, 221.0, 152.0, 96.0, 66.0, 39.0, 25.0, 19.0, 9.0, 4.0, 5.0, 3.0, 0.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.02734375, -4.85833740234375, -4.6893310546875, -4.52032470703125, -4.351318359375, -4.18231201171875, -4.0133056640625, -3.84429931640625, -3.67529296875, -3.50628662109375, -3.3372802734375, -3.16827392578125, -2.999267578125, -2.83026123046875, -2.6612548828125, -2.49224853515625, -2.3232421875, -2.15423583984375, -1.9852294921875, -1.81622314453125, -1.647216796875, -1.47821044921875, -1.3092041015625, -1.14019775390625, -0.97119140625, -0.80218505859375, -0.6331787109375, -0.46417236328125, -0.295166015625, -0.12615966796875, 0.0428466796875, 0.21185302734375, 0.380859375, 0.54986572265625, 0.7188720703125, 0.88787841796875, 1.056884765625, 1.22589111328125, 1.3948974609375, 1.56390380859375, 1.73291015625, 1.90191650390625, 2.0709228515625, 2.23992919921875, 2.408935546875, 2.57794189453125, 2.7469482421875, 2.91595458984375, 3.0849609375, 3.25396728515625, 3.4229736328125, 3.59197998046875, 3.760986328125, 3.92999267578125, 4.0989990234375, 4.26800537109375, 4.43701171875, 4.60601806640625, 4.7750244140625, 4.94403076171875, 5.113037109375, 5.28204345703125, 5.4510498046875, 5.62005615234375, 5.7890625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 3.0, 8.0, 6.0, 5.0, 12.0, 18.0, 16.0, 33.0, 41.0, 44.0, 65.0, 77.0, 130.0, 143.0, 182.0, 240.0, 302.0, 407.0, 497.0, 416.0, 353.0, 259.0, 187.0, 152.0, 121.0, 85.0, 58.0, 35.0, 36.0, 36.0, 22.0, 21.0, 12.0, 16.0, 7.0, 5.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-7.609375, -7.40716552734375, -7.2049560546875, -7.00274658203125, -6.800537109375, -6.59832763671875, -6.3961181640625, -6.19390869140625, -5.99169921875, -5.78948974609375, -5.5872802734375, -5.38507080078125, -5.182861328125, -4.98065185546875, -4.7784423828125, -4.57623291015625, -4.3740234375, -4.17181396484375, -3.9696044921875, -3.76739501953125, -3.565185546875, -3.36297607421875, -3.1607666015625, -2.95855712890625, -2.75634765625, -2.55413818359375, -2.3519287109375, -2.14971923828125, -1.947509765625, -1.74530029296875, -1.5430908203125, -1.34088134765625, -1.138671875, -0.93646240234375, -0.7342529296875, -0.53204345703125, -0.329833984375, -0.12762451171875, 0.0745849609375, 0.27679443359375, 0.47900390625, 0.68121337890625, 0.8834228515625, 1.08563232421875, 1.287841796875, 1.49005126953125, 1.6922607421875, 1.89447021484375, 2.0966796875, 2.29888916015625, 2.5010986328125, 2.70330810546875, 2.905517578125, 3.10772705078125, 3.3099365234375, 3.51214599609375, 3.71435546875, 3.91656494140625, 4.1187744140625, 4.32098388671875, 4.523193359375, 4.72540283203125, 4.9276123046875, 5.12982177734375, 5.33203125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 13.0, 7.0, 15.0, 16.0, 23.0, 34.0, 59.0, 69.0, 88.0, 151.0, 211.0, 342.0, 867.0, 5337.0, 114080.0, 3680037.0, 379299.0, 11006.0, 1358.0, 460.0, 249.0, 162.0, 118.0, 88.0, 56.0, 38.0, 22.0, 15.0, 14.0, 14.0, 6.0, 6.0, 7.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.953125, -24.050537109375, -23.14794921875, -22.245361328125, -21.3427734375, -20.440185546875, -19.53759765625, -18.635009765625, -17.732421875, -16.829833984375, -15.92724609375, -15.024658203125, -14.1220703125, -13.219482421875, -12.31689453125, -11.414306640625, -10.51171875, -9.609130859375, -8.70654296875, -7.803955078125, -6.9013671875, -5.998779296875, -5.09619140625, -4.193603515625, -3.291015625, -2.388427734375, -1.48583984375, -0.583251953125, 0.3193359375, 1.221923828125, 2.12451171875, 3.027099609375, 3.9296875, 4.832275390625, 5.73486328125, 6.637451171875, 7.5400390625, 8.442626953125, 9.34521484375, 10.247802734375, 11.150390625, 12.052978515625, 12.95556640625, 13.858154296875, 14.7607421875, 15.663330078125, 16.56591796875, 17.468505859375, 18.37109375, 19.273681640625, 20.17626953125, 21.078857421875, 21.9814453125, 22.884033203125, 23.78662109375, 24.689208984375, 25.591796875, 26.494384765625, 27.39697265625, 28.299560546875, 29.2021484375, 30.104736328125, 31.00732421875, 31.909912109375, 32.8125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 11.0, 24.0, 75.0, 149.0, 218.0, 197.0, 164.0, 115.0, 41.0, 13.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.221282958984375, -50.61147689819336, -48.00167465209961, -45.391868591308594, -42.782066345214844, -40.17226028442383, -37.56245422363281, -34.95265197753906, -32.34284591674805, -29.733041763305664, -27.12323760986328, -24.513431549072266, -21.903627395629883, -19.2938232421875, -16.684017181396484, -14.074213027954102, -11.464408874511719, -8.854604721069336, -6.244799613952637, -3.6349949836730957, -1.0251903533935547, 1.5846138000488281, 4.194418907165527, 6.804224014282227, 9.41402816772461, 12.023832321166992, 14.633637428283691, 17.24344253540039, 19.853246688842773, 22.463050842285156, 25.072856903076172, 27.682661056518555, 30.292457580566406, 32.90226364135742, 35.51206588745117, 38.12187194824219, 40.73167419433594, 43.34148025512695, 45.95128631591797, 48.56108856201172, 51.170894622802734, 53.78070068359375, 56.3905029296875, 59.000308990478516, 61.61011505126953, 64.21991729736328, 66.82971954345703, 69.43952941894531, 72.04933166503906, 74.65913391113281, 77.2689437866211, 79.87874603271484, 82.4885482788086, 85.09835815429688, 87.70816040039062, 90.31796264648438, 92.92776489257812, 95.53756713867188, 98.14737701416016, 100.7571792602539, 103.36698150634766, 105.97679138183594, 108.58659362792969, 111.19639587402344, 113.80620574951172]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 8.0, 7.0, 7.0, 13.0, 9.0, 17.0, 22.0, 28.0, 23.0, 16.0, 27.0, 28.0, 36.0, 26.0, 27.0, 48.0, 34.0, 43.0, 36.0, 51.0, 38.0, 38.0, 39.0, 57.0, 39.0, 41.0, 31.0, 34.0, 22.0, 28.0, 23.0, 11.0, 17.0, 10.0, 13.0, 9.0, 13.0, 10.0, 9.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-23.25274658203125, -22.515350341796875, -21.777952194213867, -21.040555953979492, -20.303157806396484, -19.56576156616211, -18.828365325927734, -18.090967178344727, -17.35356903076172, -16.616172790527344, -15.878774642944336, -15.141378402709961, -14.403980255126953, -13.666584014892578, -12.929186820983887, -12.191789627075195, -11.45439338684082, -10.716996192932129, -9.979598999023438, -9.242202758789062, -8.504804611206055, -7.7674078941345215, -7.030011177062988, -6.292613983154297, -5.5552167892456055, -4.817819595336914, -4.080422401428223, -3.3430256843566895, -2.605628490447998, -1.8682312965393066, -1.1308345794677734, -0.39343738555908203, 0.3439598083496094, 1.0813568830490112, 1.818753957748413, 2.5561509132385254, 3.293548107147217, 4.030945301055908, 4.768342018127441, 5.505739212036133, 6.243136405944824, 6.980533599853516, 7.717930793762207, 8.455327987670898, 9.192724227905273, 9.930122375488281, 10.667518615722656, 11.404915809631348, 12.142313003540039, 12.87971019744873, 13.617107391357422, 14.354503631591797, 15.091901779174805, 15.82929801940918, 16.566696166992188, 17.304092407226562, 18.041488647460938, 18.778884887695312, 19.51628303527832, 20.253679275512695, 20.991077423095703, 21.728473663330078, 22.465869903564453, 23.20326805114746, 23.94066619873047]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 1.0, 2.0, 7.0, 5.0, 9.0, 8.0, 8.0, 6.0, 11.0, 16.0, 19.0, 20.0, 16.0, 25.0, 39.0, 35.0, 43.0, 38.0, 45.0, 46.0, 42.0, 49.0, 35.0, 41.0, 43.0, 40.0, 33.0, 30.0, 38.0, 33.0, 26.0, 27.0, 27.0, 21.0, 16.0, 14.0, 16.0, 8.0, 12.0, 9.0, 7.0, 8.0, 5.0, 6.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.54296875, -3.434814453125, -3.32666015625, -3.218505859375, -3.1103515625, -3.002197265625, -2.89404296875, -2.785888671875, -2.677734375, -2.569580078125, -2.46142578125, -2.353271484375, -2.2451171875, -2.136962890625, -2.02880859375, -1.920654296875, -1.8125, -1.704345703125, -1.59619140625, -1.488037109375, -1.3798828125, -1.271728515625, -1.16357421875, -1.055419921875, -0.947265625, -0.839111328125, -0.73095703125, -0.622802734375, -0.5146484375, -0.406494140625, -0.29833984375, -0.190185546875, -0.08203125, 0.026123046875, 0.13427734375, 0.242431640625, 0.3505859375, 0.458740234375, 0.56689453125, 0.675048828125, 0.783203125, 0.891357421875, 0.99951171875, 1.107666015625, 1.2158203125, 1.323974609375, 1.43212890625, 1.540283203125, 1.6484375, 1.756591796875, 1.86474609375, 1.972900390625, 2.0810546875, 2.189208984375, 2.29736328125, 2.405517578125, 2.513671875, 2.621826171875, 2.72998046875, 2.838134765625, 2.9462890625, 3.054443359375, 3.16259765625, 3.270751953125, 3.37890625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 16.0, 25.0, 26.0, 31.0, 50.0, 79.0, 110.0, 195.0, 269.0, 348.0, 487.0, 774.0, 1133.0, 1540.0, 2258.0, 3273.0, 4706.0, 6861.0, 10331.0, 15723.0, 24873.0, 39823.0, 66207.0, 126211.0, 353662.0, 174257.0, 82342.0, 47376.0, 29272.0, 18539.0, 11940.0, 7949.0, 5436.0, 3779.0, 2594.0, 1872.0, 1309.0, 855.0, 631.0, 442.0, 315.0, 196.0, 126.0, 106.0, 62.0, 44.0, 38.0, 26.0, 8.0, 10.0, 8.0, 4.0, 2.0, 1.0, 4.0, 3.0], "bins": [-0.261962890625, -0.2539482116699219, -0.24593353271484375, -0.23791885375976562, -0.2299041748046875, -0.22188949584960938, -0.21387481689453125, -0.20586013793945312, -0.197845458984375, -0.18983078002929688, -0.18181610107421875, -0.17380142211914062, -0.1657867431640625, -0.15777206420898438, -0.14975738525390625, -0.14174270629882812, -0.13372802734375, -0.12571334838867188, -0.11769866943359375, -0.10968399047851562, -0.1016693115234375, -0.09365463256835938, -0.08563995361328125, -0.07762527465820312, -0.069610595703125, -0.061595916748046875, -0.05358123779296875, -0.045566558837890625, -0.0375518798828125, -0.029537200927734375, -0.02152252197265625, -0.013507843017578125, -0.0054931640625, 0.002521514892578125, 0.01053619384765625, 0.018550872802734375, 0.0265655517578125, 0.034580230712890625, 0.04259490966796875, 0.050609588623046875, 0.058624267578125, 0.06663894653320312, 0.07465362548828125, 0.08266830444335938, 0.0906829833984375, 0.09869766235351562, 0.10671234130859375, 0.11472702026367188, 0.12274169921875, 0.13075637817382812, 0.13877105712890625, 0.14678573608398438, 0.1548004150390625, 0.16281509399414062, 0.17082977294921875, 0.17884445190429688, 0.186859130859375, 0.19487380981445312, 0.20288848876953125, 0.21090316772460938, 0.2189178466796875, 0.22693252563476562, 0.23494720458984375, 0.24296188354492188, 0.2509765625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 3.0, 3.0, 5.0, 6.0, 7.0, 9.0, 14.0, 24.0, 19.0, 25.0, 18.0, 24.0, 19.0, 28.0, 28.0, 38.0, 25.0, 36.0, 32.0, 35.0, 37.0, 35.0, 1062.0, 43.0, 30.0, 44.0, 38.0, 31.0, 31.0, 34.0, 23.0, 28.0, 31.0, 20.0, 13.0, 13.0, 15.0, 17.0, 10.0, 11.0, 13.0, 10.0, 6.0, 4.0, 3.0, 4.0, 6.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-2.12890625, -2.060272216796875, -1.99163818359375, -1.923004150390625, -1.8543701171875, -1.785736083984375, -1.71710205078125, -1.648468017578125, -1.579833984375, -1.511199951171875, -1.44256591796875, -1.373931884765625, -1.3052978515625, -1.236663818359375, -1.16802978515625, -1.099395751953125, -1.03076171875, -0.962127685546875, -0.89349365234375, -0.824859619140625, -0.7562255859375, -0.687591552734375, -0.61895751953125, -0.550323486328125, -0.481689453125, -0.413055419921875, -0.34442138671875, -0.275787353515625, -0.2071533203125, -0.138519287109375, -0.06988525390625, -0.001251220703125, 0.0673828125, 0.136016845703125, 0.20465087890625, 0.273284912109375, 0.3419189453125, 0.410552978515625, 0.47918701171875, 0.547821044921875, 0.616455078125, 0.685089111328125, 0.75372314453125, 0.822357177734375, 0.8909912109375, 0.959625244140625, 1.02825927734375, 1.096893310546875, 1.16552734375, 1.234161376953125, 1.30279541015625, 1.371429443359375, 1.4400634765625, 1.508697509765625, 1.57733154296875, 1.645965576171875, 1.714599609375, 1.783233642578125, 1.85186767578125, 1.920501708984375, 1.9891357421875, 2.057769775390625, 2.12640380859375, 2.195037841796875, 2.263671875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 11.0, 24.0, 23.0, 37.0, 50.0, 89.0, 106.0, 132.0, 211.0, 287.0, 433.0, 568.0, 859.0, 1220.0, 1728.0, 2427.0, 3679.0, 5503.0, 8186.0, 12410.0, 19644.0, 31914.0, 54019.0, 98008.0, 236050.0, 1351994.0, 110966.0, 59300.0, 34784.0, 21617.0, 13637.0, 8823.0, 5830.0, 3901.0, 2712.0, 1782.0, 1224.0, 847.0, 620.0, 436.0, 322.0, 218.0, 151.0, 94.0, 61.0, 61.0, 39.0, 20.0, 23.0, 15.0, 8.0, 9.0, 4.0, 3.0, 0.0, 3.0], "bins": [-0.15185546875, -0.14726638793945312, -0.14267730712890625, -0.13808822631835938, -0.1334991455078125, -0.12891006469726562, -0.12432098388671875, -0.11973190307617188, -0.115142822265625, -0.11055374145507812, -0.10596466064453125, -0.10137557983398438, -0.0967864990234375, -0.09219741821289062, -0.08760833740234375, -0.08301925659179688, -0.07843017578125, -0.07384109497070312, -0.06925201416015625, -0.06466293334960938, -0.0600738525390625, -0.055484771728515625, -0.05089569091796875, -0.046306610107421875, -0.041717529296875, -0.037128448486328125, -0.03253936767578125, -0.027950286865234375, -0.0233612060546875, -0.018772125244140625, -0.01418304443359375, -0.009593963623046875, -0.0050048828125, -0.000415802001953125, 0.00417327880859375, 0.008762359619140625, 0.0133514404296875, 0.017940521240234375, 0.02252960205078125, 0.027118682861328125, 0.031707763671875, 0.036296844482421875, 0.04088592529296875, 0.045475006103515625, 0.0500640869140625, 0.054653167724609375, 0.05924224853515625, 0.06383132934570312, 0.06842041015625, 0.07300949096679688, 0.07759857177734375, 0.08218765258789062, 0.0867767333984375, 0.09136581420898438, 0.09595489501953125, 0.10054397583007812, 0.105133056640625, 0.10972213745117188, 0.11431121826171875, 0.11890029907226562, 0.1234893798828125, 0.12807846069335938, 0.13266754150390625, 0.13725662231445312, 0.141845703125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 7.0, 2.0, 2.0, 4.0, 3.0, 6.0, 10.0, 7.0, 15.0, 17.0, 28.0, 23.0, 27.0, 44.0, 52.0, 68.0, 87.0, 101.0, 89.0, 80.0, 77.0, 46.0, 35.0, 33.0, 30.0, 16.0, 21.0, 7.0, 8.0, 10.0, 9.0, 9.0, 8.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1742115020751953e-05, -1.1364929378032684e-05, -1.0987743735313416e-05, -1.0610558092594147e-05, -1.0233372449874878e-05, -9.856186807155609e-06, -9.47900116443634e-06, -9.101815521717072e-06, -8.724629878997803e-06, -8.347444236278534e-06, -7.970258593559265e-06, -7.593072950839996e-06, -7.2158873081207275e-06, -6.838701665401459e-06, -6.46151602268219e-06, -6.084330379962921e-06, -5.707144737243652e-06, -5.3299590945243835e-06, -4.952773451805115e-06, -4.575587809085846e-06, -4.198402166366577e-06, -3.821216523647308e-06, -3.4440308809280396e-06, -3.0668452382087708e-06, -2.689659595489502e-06, -2.312473952770233e-06, -1.9352883100509644e-06, -1.5581026673316956e-06, -1.1809170246124268e-06, -8.03731381893158e-07, -4.2654573917388916e-07, -4.936009645462036e-08, 3.2782554626464844e-07, 7.050111889839172e-07, 1.082196831703186e-06, 1.4593824744224548e-06, 1.8365681171417236e-06, 2.2137537598609924e-06, 2.5909394025802612e-06, 2.96812504529953e-06, 3.345310688018799e-06, 3.7224963307380676e-06, 4.0996819734573364e-06, 4.476867616176605e-06, 4.854053258895874e-06, 5.231238901615143e-06, 5.608424544334412e-06, 5.98561018705368e-06, 6.362795829772949e-06, 6.739981472492218e-06, 7.117167115211487e-06, 7.494352757930756e-06, 7.871538400650024e-06, 8.248724043369293e-06, 8.625909686088562e-06, 9.00309532880783e-06, 9.3802809715271e-06, 9.757466614246368e-06, 1.0134652256965637e-05, 1.0511837899684906e-05, 1.0889023542404175e-05, 1.1266209185123444e-05, 1.1643394827842712e-05, 1.2020580470561981e-05, 1.239776611328125e-05]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 10.0, 4.0, 5.0, 16.0, 15.0, 10.0, 15.0, 26.0, 31.0, 38.0, 72.0, 104.0, 220.0, 1130.0, 9777.0, 145421.0, 831037.0, 55019.0, 4502.0, 619.0, 159.0, 87.0, 58.0, 43.0, 34.0, 28.0, 18.0, 10.0, 7.0, 4.0, 9.0, 4.0, 5.0, 10.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002372264862060547, -0.0002301093190908432, -0.00022299215197563171, -0.00021587498486042023, -0.00020875781774520874, -0.00020164065062999725, -0.00019452348351478577, -0.00018740631639957428, -0.0001802891492843628, -0.0001731719821691513, -0.00016605481505393982, -0.00015893764793872833, -0.00015182048082351685, -0.00014470331370830536, -0.00013758614659309387, -0.00013046897947788239, -0.0001233518123626709, -0.00011623464524745941, -0.00010911747813224792, -0.00010200031101703644, -9.488314390182495e-05, -8.776597678661346e-05, -8.064880967140198e-05, -7.353164255619049e-05, -6.6414475440979e-05, -5.929730832576752e-05, -5.218014121055603e-05, -4.5062974095344543e-05, -3.794580698013306e-05, -3.082863986492157e-05, -2.3711472749710083e-05, -1.6594305634498596e-05, -9.47713851928711e-06, -2.3599714040756226e-06, 4.757195711135864e-06, 1.1874362826347351e-05, 1.8991529941558838e-05, 2.6108697056770325e-05, 3.322586417198181e-05, 4.03430312871933e-05, 4.7460198402404785e-05, 5.457736551761627e-05, 6.169453263282776e-05, 6.881169974803925e-05, 7.592886686325073e-05, 8.304603397846222e-05, 9.01632010936737e-05, 9.728036820888519e-05, 0.00010439753532409668, 0.00011151470243930817, 0.00011863186955451965, 0.00012574903666973114, 0.00013286620378494263, 0.00013998337090015411, 0.0001471005380153656, 0.0001542177051305771, 0.00016133487224578857, 0.00016845203936100006, 0.00017556920647621155, 0.00018268637359142303, 0.00018980354070663452, 0.000196920707821846, 0.0002040378749370575, 0.00021115504205226898, 0.00021827220916748047]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 9.0, 24.0, 57.0, 103.0, 176.0, 273.0, 197.0, 92.0, 45.0, 20.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.339744969503954e-05, -2.2306276150629856e-05, -2.121510260622017e-05, -2.0123927242821082e-05, -1.9032753698411398e-05, -1.7941580154001713e-05, -1.6850404790602624e-05, -1.575923124619294e-05, -1.4668057701783255e-05, -1.357688415737357e-05, -1.2485709703469183e-05, -1.1394535249564797e-05, -1.0303361705155112e-05, -9.212188160745427e-06, -8.12101370684104e-06, -7.029839252936654e-06, -5.938665708526969e-06, -4.847491709369933e-06, -3.7563177102128975e-06, -2.6651437110558618e-06, -1.573969711898826e-06, -4.827957127417903e-07, 6.083782864152454e-07, 1.699552740319632e-06, 2.790726284729317e-06, 3.8819002838863526e-06, 4.973074283043388e-06, 6.064248282200424e-06, 7.15542228135746e-06, 8.246595825767145e-06, 9.337770279671531e-06, 1.0428944733575918e-05, 1.1520118277985603e-05, 1.2611291822395287e-05, 1.3702466276299674e-05, 1.479364073020406e-05, 1.5884814274613746e-05, 1.697598781902343e-05, 1.806716318242252e-05, 1.9158336726832204e-05, 2.024951027124189e-05, 2.1340683815651573e-05, 2.2431857360061258e-05, 2.3523032723460346e-05, 2.461420626787003e-05, 2.5705379812279716e-05, 2.6796555175678805e-05, 2.788772872008849e-05, 2.8978902264498174e-05, 3.007007580890786e-05, 3.1161249353317544e-05, 3.225242471671663e-05, 3.3343596442136914e-05, 3.4434771805536e-05, 3.552594716893509e-05, 3.661712253233418e-05, 3.770829425775446e-05, 3.879946962115355e-05, 3.989064134657383e-05, 4.098181670997292e-05, 4.2072992073372006e-05, 4.316416379879229e-05, 4.4255339162191376e-05, 4.534651088761166e-05, 4.6437686251010746e-05]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 6.0, 6.0, 5.0, 8.0, 10.0, 6.0, 16.0, 13.0, 22.0, 23.0, 31.0, 16.0, 32.0, 41.0, 41.0, 38.0, 20.0, 33.0, 29.0, 43.0, 37.0, 25.0, 34.0, 37.0, 44.0, 47.0, 44.0, 28.0, 36.0, 29.0, 18.0, 16.0, 22.0, 26.0, 22.0, 22.0, 20.0, 7.0, 8.0, 11.0, 8.0, 4.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.304813385009766e-06, -5.1371753215789795e-06, -4.969537258148193e-06, -4.801899194717407e-06, -4.634261131286621e-06, -4.466623067855835e-06, -4.298985004425049e-06, -4.131346940994263e-06, -3.9637088775634766e-06, -3.7960708141326904e-06, -3.6284327507019043e-06, -3.460794687271118e-06, -3.293156623840332e-06, -3.125518560409546e-06, -2.9578804969787598e-06, -2.7902424335479736e-06, -2.6226043701171875e-06, -2.4549663066864014e-06, -2.2873282432556152e-06, -2.119690179824829e-06, -1.952052116394043e-06, -1.7844140529632568e-06, -1.6167759895324707e-06, -1.4491379261016846e-06, -1.2814998626708984e-06, -1.1138617992401123e-06, -9.462237358093262e-07, -7.7858567237854e-07, -6.109476089477539e-07, -4.4330954551696777e-07, -2.7567148208618164e-07, -1.0803341865539551e-07, 5.960464477539063e-08, 2.2724270820617676e-07, 3.948807716369629e-07, 5.62518835067749e-07, 7.301568984985352e-07, 8.977949619293213e-07, 1.0654330253601074e-06, 1.2330710887908936e-06, 1.4007091522216797e-06, 1.5683472156524658e-06, 1.735985279083252e-06, 1.903623342514038e-06, 2.0712614059448242e-06, 2.2388994693756104e-06, 2.4065375328063965e-06, 2.5741755962371826e-06, 2.7418136596679688e-06, 2.909451723098755e-06, 3.077089786529541e-06, 3.244727849960327e-06, 3.4123659133911133e-06, 3.5800039768218994e-06, 3.7476420402526855e-06, 3.915280103683472e-06, 4.082918167114258e-06, 4.250556230545044e-06, 4.41819429397583e-06, 4.585832357406616e-06, 4.753470420837402e-06, 4.9211084842681885e-06, 5.088746547698975e-06, 5.256384611129761e-06, 5.424022674560547e-06]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 1.0, 2.0, 7.0, 5.0, 9.0, 8.0, 8.0, 6.0, 11.0, 16.0, 19.0, 20.0, 16.0, 25.0, 39.0, 35.0, 43.0, 38.0, 45.0, 46.0, 42.0, 49.0, 35.0, 41.0, 43.0, 40.0, 33.0, 30.0, 38.0, 33.0, 26.0, 27.0, 27.0, 21.0, 16.0, 14.0, 16.0, 8.0, 12.0, 9.0, 7.0, 8.0, 5.0, 6.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.54296875, -3.434814453125, -3.32666015625, -3.218505859375, -3.1103515625, -3.002197265625, -2.89404296875, -2.785888671875, -2.677734375, -2.569580078125, -2.46142578125, -2.353271484375, -2.2451171875, -2.136962890625, -2.02880859375, -1.920654296875, -1.8125, -1.704345703125, -1.59619140625, -1.488037109375, -1.3798828125, -1.271728515625, -1.16357421875, -1.055419921875, -0.947265625, -0.839111328125, -0.73095703125, -0.622802734375, -0.5146484375, -0.406494140625, -0.29833984375, -0.190185546875, -0.08203125, 0.026123046875, 0.13427734375, 0.242431640625, 0.3505859375, 0.458740234375, 0.56689453125, 0.675048828125, 0.783203125, 0.891357421875, 0.99951171875, 1.107666015625, 1.2158203125, 1.323974609375, 1.43212890625, 1.540283203125, 1.6484375, 1.756591796875, 1.86474609375, 1.972900390625, 2.0810546875, 2.189208984375, 2.29736328125, 2.405517578125, 2.513671875, 2.621826171875, 2.72998046875, 2.838134765625, 2.9462890625, 3.054443359375, 3.16259765625, 3.270751953125, 3.37890625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 7.0, 13.0, 23.0, 41.0, 51.0, 101.0, 162.0, 281.0, 438.0, 851.0, 1537.0, 2712.0, 4865.0, 8861.0, 17578.0, 35563.0, 74234.0, 174076.0, 403611.0, 175040.0, 75253.0, 35809.0, 17651.0, 8866.0, 4682.0, 2661.0, 1528.0, 854.0, 495.0, 305.0, 178.0, 101.0, 56.0, 40.0, 21.0, 7.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0859375, -3.95623779296875, -3.8265380859375, -3.69683837890625, -3.567138671875, -3.43743896484375, -3.3077392578125, -3.17803955078125, -3.04833984375, -2.91864013671875, -2.7889404296875, -2.65924072265625, -2.529541015625, -2.39984130859375, -2.2701416015625, -2.14044189453125, -2.0107421875, -1.88104248046875, -1.7513427734375, -1.62164306640625, -1.491943359375, -1.36224365234375, -1.2325439453125, -1.10284423828125, -0.97314453125, -0.84344482421875, -0.7137451171875, -0.58404541015625, -0.454345703125, -0.32464599609375, -0.1949462890625, -0.06524658203125, 0.064453125, 0.19415283203125, 0.3238525390625, 0.45355224609375, 0.583251953125, 0.71295166015625, 0.8426513671875, 0.97235107421875, 1.10205078125, 1.23175048828125, 1.3614501953125, 1.49114990234375, 1.620849609375, 1.75054931640625, 1.8802490234375, 2.00994873046875, 2.1396484375, 2.26934814453125, 2.3990478515625, 2.52874755859375, 2.658447265625, 2.78814697265625, 2.9178466796875, 3.04754638671875, 3.17724609375, 3.30694580078125, 3.4366455078125, 3.56634521484375, 3.696044921875, 3.82574462890625, 3.9554443359375, 4.08514404296875, 4.21484375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 7.0, 16.0, 12.0, 10.0, 13.0, 13.0, 20.0, 25.0, 26.0, 32.0, 31.0, 43.0, 30.0, 40.0, 55.0, 74.0, 134.0, 311.0, 1506.0, 154.0, 70.0, 62.0, 54.0, 42.0, 36.0, 29.0, 29.0, 19.0, 26.0, 15.0, 13.0, 10.0, 15.0, 10.0, 10.0, 11.0, 4.0, 7.0, 8.0, 5.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-12.140625, -11.762939453125, -11.38525390625, -11.007568359375, -10.6298828125, -10.252197265625, -9.87451171875, -9.496826171875, -9.119140625, -8.741455078125, -8.36376953125, -7.986083984375, -7.6083984375, -7.230712890625, -6.85302734375, -6.475341796875, -6.09765625, -5.719970703125, -5.34228515625, -4.964599609375, -4.5869140625, -4.209228515625, -3.83154296875, -3.453857421875, -3.076171875, -2.698486328125, -2.32080078125, -1.943115234375, -1.5654296875, -1.187744140625, -0.81005859375, -0.432373046875, -0.0546875, 0.322998046875, 0.70068359375, 1.078369140625, 1.4560546875, 1.833740234375, 2.21142578125, 2.589111328125, 2.966796875, 3.344482421875, 3.72216796875, 4.099853515625, 4.4775390625, 4.855224609375, 5.23291015625, 5.610595703125, 5.98828125, 6.365966796875, 6.74365234375, 7.121337890625, 7.4990234375, 7.876708984375, 8.25439453125, 8.632080078125, 9.009765625, 9.387451171875, 9.76513671875, 10.142822265625, 10.5205078125, 10.898193359375, 11.27587890625, 11.653564453125, 12.03125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 6.0, 10.0, 3.0, 5.0, 10.0, 17.0, 7.0, 18.0, 16.0, 31.0, 28.0, 53.0, 43.0, 67.0, 86.0, 118.0, 193.0, 302.0, 737.0, 3312.0, 43789.0, 2935581.0, 152658.0, 6352.0, 1085.0, 378.0, 208.0, 128.0, 115.0, 67.0, 61.0, 42.0, 33.0, 30.0, 26.0, 14.0, 15.0, 17.0, 6.0, 12.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-26.875, -26.02587890625, -25.1767578125, -24.32763671875, -23.478515625, -22.62939453125, -21.7802734375, -20.93115234375, -20.08203125, -19.23291015625, -18.3837890625, -17.53466796875, -16.685546875, -15.83642578125, -14.9873046875, -14.13818359375, -13.2890625, -12.43994140625, -11.5908203125, -10.74169921875, -9.892578125, -9.04345703125, -8.1943359375, -7.34521484375, -6.49609375, -5.64697265625, -4.7978515625, -3.94873046875, -3.099609375, -2.25048828125, -1.4013671875, -0.55224609375, 0.296875, 1.14599609375, 1.9951171875, 2.84423828125, 3.693359375, 4.54248046875, 5.3916015625, 6.24072265625, 7.08984375, 7.93896484375, 8.7880859375, 9.63720703125, 10.486328125, 11.33544921875, 12.1845703125, 13.03369140625, 13.8828125, 14.73193359375, 15.5810546875, 16.43017578125, 17.279296875, 18.12841796875, 18.9775390625, 19.82666015625, 20.67578125, 21.52490234375, 22.3740234375, 23.22314453125, 24.072265625, 24.92138671875, 25.7705078125, 26.61962890625, 27.46875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 15.0, 71.0, 260.0, 387.0, 207.0, 62.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.00815200805664, -13.837268829345703, -11.666386604309082, -9.495504379272461, -7.324621200561523, -5.153738021850586, -2.982855796813965, -0.8119735717773438, 1.3589096069335938, 3.529792308807373, 5.700675010681152, 7.871557712554932, 10.042440414428711, 12.213323593139648, 14.38420581817627, 16.55508804321289, 18.725971221923828, 20.896854400634766, 23.067737579345703, 25.238618850708008, 27.409502029418945, 29.580385208129883, 31.751266479492188, 33.922149658203125, 36.09303283691406, 38.263916015625, 40.43479919433594, 42.605682373046875, 44.77656555175781, 46.94744873046875, 49.11832809448242, 51.28921127319336, 53.46009063720703, 55.63097381591797, 57.801856994628906, 59.972740173339844, 62.14362335205078, 64.31450653076172, 66.48538970947266, 68.65626525878906, 70.8271484375, 72.99803161621094, 75.16891479492188, 77.33979797363281, 79.51068115234375, 81.68156433105469, 83.85244750976562, 86.02333068847656, 88.1942138671875, 90.36509704589844, 92.53598022460938, 94.70686340332031, 96.87774658203125, 99.04862976074219, 101.21951293945312, 103.39039611816406, 105.561279296875, 107.73216247558594, 109.90304565429688, 112.07392883300781, 114.24481201171875, 116.41569519042969, 118.58657836914062, 120.75746154785156, 122.92833709716797]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 3.0, 5.0, 7.0, 9.0, 17.0, 12.0, 29.0, 21.0, 21.0, 24.0, 27.0, 36.0, 36.0, 31.0, 32.0, 40.0, 44.0, 27.0, 39.0, 37.0, 35.0, 50.0, 47.0, 29.0, 30.0, 34.0, 31.0, 44.0, 20.0, 19.0, 19.0, 20.0, 17.0, 19.0, 11.0, 13.0, 10.0, 6.0, 13.0, 5.0, 4.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.546459197998047, -30.5489501953125, -29.551441192626953, -28.553932189941406, -27.55642318725586, -26.558914184570312, -25.5614070892334, -24.56389808654785, -23.566389083862305, -22.568880081176758, -21.57137107849121, -20.573862075805664, -19.57635498046875, -18.578845977783203, -17.581336975097656, -16.58382797241211, -15.586318969726562, -14.588809967041016, -13.591300964355469, -12.593792915344238, -11.596283912658691, -10.598774909973145, -9.601266860961914, -8.603757858276367, -7.60624885559082, -6.608739852905273, -5.611231327056885, -4.613722801208496, -3.616213798522949, -2.6187047958374023, -1.6211962699890137, -0.623687744140625, 0.3738212585449219, 1.3713300228118896, 2.3688387870788574, 3.366347551345825, 4.363856315612793, 5.36136531829834, 6.3588738441467285, 7.356382369995117, 8.353891372680664, 9.351400375366211, 10.348909378051758, 11.346417427062988, 12.343926429748535, 13.341435432434082, 14.338943481445312, 15.33645248413086, 16.333961486816406, 17.331470489501953, 18.3289794921875, 19.326488494873047, 20.323997497558594, 21.32150650024414, 22.319013595581055, 23.3165225982666, 24.31403160095215, 25.311540603637695, 26.309049606323242, 27.30655860900879, 28.304065704345703, 29.30157470703125, 30.299083709716797, 31.296592712402344, 32.29410171508789]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 2.0, 9.0, 9.0, 6.0, 6.0, 6.0, 12.0, 18.0, 13.0, 18.0, 18.0, 38.0, 22.0, 24.0, 52.0, 48.0, 39.0, 45.0, 41.0, 47.0, 33.0, 43.0, 49.0, 28.0, 43.0, 37.0, 36.0, 26.0, 31.0, 23.0, 35.0, 21.0, 19.0, 18.0, 10.0, 11.0, 11.0, 8.0, 6.0, 7.0, 8.0, 7.0, 5.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-3.875, -3.760894775390625, -3.64678955078125, -3.532684326171875, -3.4185791015625, -3.304473876953125, -3.19036865234375, -3.076263427734375, -2.962158203125, -2.848052978515625, -2.73394775390625, -2.619842529296875, -2.5057373046875, -2.391632080078125, -2.27752685546875, -2.163421630859375, -2.04931640625, -1.935211181640625, -1.82110595703125, -1.707000732421875, -1.5928955078125, -1.478790283203125, -1.36468505859375, -1.250579833984375, -1.136474609375, -1.022369384765625, -0.90826416015625, -0.794158935546875, -0.6800537109375, -0.565948486328125, -0.45184326171875, -0.337738037109375, -0.2236328125, -0.109527587890625, 0.00457763671875, 0.118682861328125, 0.2327880859375, 0.346893310546875, 0.46099853515625, 0.575103759765625, 0.689208984375, 0.803314208984375, 0.91741943359375, 1.031524658203125, 1.1456298828125, 1.259735107421875, 1.37384033203125, 1.487945556640625, 1.60205078125, 1.716156005859375, 1.83026123046875, 1.944366455078125, 2.0584716796875, 2.172576904296875, 2.28668212890625, 2.400787353515625, 2.514892578125, 2.628997802734375, 2.74310302734375, 2.857208251953125, 2.9713134765625, 3.085418701171875, 3.19952392578125, 3.313629150390625, 3.427734375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 8.0, 11.0, 17.0, 15.0, 12.0, 19.0, 36.0, 29.0, 50.0, 83.0, 165.0, 325.0, 714.0, 1801.0, 5232.0, 18311.0, 82901.0, 674367.0, 2859598.0, 464899.0, 64102.0, 14547.0, 4264.0, 1526.0, 591.0, 257.0, 105.0, 87.0, 40.0, 36.0, 28.0, 25.0, 14.0, 8.0, 8.0, 10.0, 5.0, 7.0, 5.0, 6.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.640625, -10.322265625, -10.00390625, -9.685546875, -9.3671875, -9.048828125, -8.73046875, -8.412109375, -8.09375, -7.775390625, -7.45703125, -7.138671875, -6.8203125, -6.501953125, -6.18359375, -5.865234375, -5.546875, -5.228515625, -4.91015625, -4.591796875, -4.2734375, -3.955078125, -3.63671875, -3.318359375, -3.0, -2.681640625, -2.36328125, -2.044921875, -1.7265625, -1.408203125, -1.08984375, -0.771484375, -0.453125, -0.134765625, 0.18359375, 0.501953125, 0.8203125, 1.138671875, 1.45703125, 1.775390625, 2.09375, 2.412109375, 2.73046875, 3.048828125, 3.3671875, 3.685546875, 4.00390625, 4.322265625, 4.640625, 4.958984375, 5.27734375, 5.595703125, 5.9140625, 6.232421875, 6.55078125, 6.869140625, 7.1875, 7.505859375, 7.82421875, 8.142578125, 8.4609375, 8.779296875, 9.09765625, 9.416015625, 9.734375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 6.0, 8.0, 13.0, 19.0, 24.0, 29.0, 32.0, 66.0, 83.0, 117.0, 180.0, 261.0, 410.0, 553.0, 590.0, 495.0, 347.0, 239.0, 172.0, 123.0, 84.0, 51.0, 53.0, 37.0, 22.0, 12.0, 9.0, 10.0, 3.0, 4.0, 6.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.9609375, -6.7154541015625, -6.469970703125, -6.2244873046875, -5.97900390625, -5.7335205078125, -5.488037109375, -5.2425537109375, -4.9970703125, -4.7515869140625, -4.506103515625, -4.2606201171875, -4.01513671875, -3.7696533203125, -3.524169921875, -3.2786865234375, -3.033203125, -2.7877197265625, -2.542236328125, -2.2967529296875, -2.05126953125, -1.8057861328125, -1.560302734375, -1.3148193359375, -1.0693359375, -0.8238525390625, -0.578369140625, -0.3328857421875, -0.08740234375, 0.1580810546875, 0.403564453125, 0.6490478515625, 0.89453125, 1.1400146484375, 1.385498046875, 1.6309814453125, 1.87646484375, 2.1219482421875, 2.367431640625, 2.6129150390625, 2.8583984375, 3.1038818359375, 3.349365234375, 3.5948486328125, 3.84033203125, 4.0858154296875, 4.331298828125, 4.5767822265625, 4.822265625, 5.0677490234375, 5.313232421875, 5.5587158203125, 5.80419921875, 6.0496826171875, 6.295166015625, 6.5406494140625, 6.7861328125, 7.0316162109375, 7.277099609375, 7.5225830078125, 7.76806640625, 8.0135498046875, 8.259033203125, 8.5045166015625, 8.75]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 12.0, 6.0, 29.0, 44.0, 60.0, 81.0, 126.0, 188.0, 348.0, 913.0, 5473.0, 213276.0, 3885459.0, 83380.0, 3452.0, 672.0, 308.0, 155.0, 99.0, 61.0, 38.0, 30.0, 16.0, 16.0, 10.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.5625, -40.451171875, -39.33984375, -38.228515625, -37.1171875, -36.005859375, -34.89453125, -33.783203125, -32.671875, -31.560546875, -30.44921875, -29.337890625, -28.2265625, -27.115234375, -26.00390625, -24.892578125, -23.78125, -22.669921875, -21.55859375, -20.447265625, -19.3359375, -18.224609375, -17.11328125, -16.001953125, -14.890625, -13.779296875, -12.66796875, -11.556640625, -10.4453125, -9.333984375, -8.22265625, -7.111328125, -6.0, -4.888671875, -3.77734375, -2.666015625, -1.5546875, -0.443359375, 0.66796875, 1.779296875, 2.890625, 4.001953125, 5.11328125, 6.224609375, 7.3359375, 8.447265625, 9.55859375, 10.669921875, 11.78125, 12.892578125, 14.00390625, 15.115234375, 16.2265625, 17.337890625, 18.44921875, 19.560546875, 20.671875, 21.783203125, 22.89453125, 24.005859375, 25.1171875, 26.228515625, 27.33984375, 28.451171875, 29.5625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 21.0, 63.0, 169.0, 267.0, 245.0, 161.0, 60.0, 17.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.76300811767578, -110.67594909667969, -107.58889770507812, -104.50183868408203, -101.41477966308594, -98.32772827148438, -95.24066925048828, -92.15361022949219, -89.06655883789062, -85.97949981689453, -82.89244842529297, -79.80538940429688, -76.71833038330078, -73.63127136230469, -70.54421997070312, -67.45716094970703, -64.37010192871094, -61.28304672241211, -58.195987701416016, -55.10893249511719, -52.021873474121094, -48.934818267822266, -45.84776306152344, -42.760704040527344, -39.673648834228516, -36.58659362792969, -33.499534606933594, -30.412479400634766, -27.325422286987305, -24.238365173339844, -21.151309967041016, -18.064252853393555, -14.977195739746094, -11.890138626098633, -8.803082466125488, -5.716026306152344, -2.628969192504883, 0.4580879211425781, 3.5451431274414062, 6.632200241088867, 9.719257354736328, 12.806314468383789, 15.893370628356934, 18.980426788330078, 22.06748390197754, 25.154541015625, 28.241596221923828, 31.32865333557129, 34.41571044921875, 37.50276565551758, 40.58982467651367, 43.6768798828125, 46.763938903808594, 49.85099411010742, 52.93804931640625, 56.025108337402344, 59.11216354370117, 62.19921875, 65.2862777709961, 68.37333679199219, 71.46038818359375, 74.54744720458984, 77.63450622558594, 80.7215576171875, 83.8086166381836]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 11.0, 6.0, 9.0, 18.0, 14.0, 14.0, 31.0, 16.0, 24.0, 10.0, 29.0, 26.0, 38.0, 32.0, 28.0, 42.0, 30.0, 27.0, 44.0, 50.0, 35.0, 43.0, 34.0, 36.0, 42.0, 32.0, 36.0, 32.0, 28.0, 19.0, 16.0, 17.0, 21.0, 17.0, 19.0, 12.0, 14.0, 10.0, 7.0, 7.0, 1.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.699356079101562, -19.03421974182129, -18.369081497192383, -17.70394515991211, -17.038806915283203, -16.37367057800293, -15.708534240722656, -15.043396949768066, -14.378259658813477, -13.713122367858887, -13.047985076904297, -12.382848739624023, -11.717711448669434, -11.052574157714844, -10.38743782043457, -9.72230052947998, -9.05716323852539, -8.3920259475708, -7.726889133453369, -7.0617523193359375, -6.396615028381348, -5.731477737426758, -5.066340923309326, -4.4012041091918945, -3.7360668182373047, -3.070929765701294, -2.405792713165283, -1.7406556606292725, -1.0755186080932617, -0.410381555557251, 0.25475549697875977, 0.9198923110961914, 1.5850296020507812, 2.250166654586792, 2.9153037071228027, 3.5804407596588135, 4.245577812194824, 4.910715103149414, 5.575851917266846, 6.240988731384277, 6.906126022338867, 7.571263313293457, 8.236400604248047, 8.90153694152832, 9.56667423248291, 10.2318115234375, 10.896947860717773, 11.562085151672363, 12.227222442626953, 12.892359733581543, 13.557497024536133, 14.222633361816406, 14.887770652770996, 15.552907943725586, 16.21804428100586, 16.883182525634766, 17.54831886291504, 18.213455200195312, 18.87859344482422, 19.543729782104492, 20.208866119384766, 20.874004364013672, 21.539140701293945, 22.20427703857422, 22.869415283203125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 4.0, 6.0, 11.0, 6.0, 9.0, 13.0, 10.0, 21.0, 24.0, 20.0, 32.0, 28.0, 35.0, 41.0, 44.0, 35.0, 51.0, 44.0, 36.0, 42.0, 46.0, 40.0, 34.0, 32.0, 34.0, 44.0, 26.0, 35.0, 18.0, 28.0, 27.0, 19.0, 20.0, 16.0, 8.0, 14.0, 8.0, 4.0, 7.0, 4.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.900390625, -3.784576416015625, -3.66876220703125, -3.552947998046875, -3.4371337890625, -3.321319580078125, -3.20550537109375, -3.089691162109375, -2.973876953125, -2.858062744140625, -2.74224853515625, -2.626434326171875, -2.5106201171875, -2.394805908203125, -2.27899169921875, -2.163177490234375, -2.04736328125, -1.931549072265625, -1.81573486328125, -1.699920654296875, -1.5841064453125, -1.468292236328125, -1.35247802734375, -1.236663818359375, -1.120849609375, -1.005035400390625, -0.88922119140625, -0.773406982421875, -0.6575927734375, -0.541778564453125, -0.42596435546875, -0.310150146484375, -0.1943359375, -0.078521728515625, 0.03729248046875, 0.153106689453125, 0.2689208984375, 0.384735107421875, 0.50054931640625, 0.616363525390625, 0.732177734375, 0.847991943359375, 0.96380615234375, 1.079620361328125, 1.1954345703125, 1.311248779296875, 1.42706298828125, 1.542877197265625, 1.65869140625, 1.774505615234375, 1.89031982421875, 2.006134033203125, 2.1219482421875, 2.237762451171875, 2.35357666015625, 2.469390869140625, 2.585205078125, 2.701019287109375, 2.81683349609375, 2.932647705078125, 3.0484619140625, 3.164276123046875, 3.28009033203125, 3.395904541015625, 3.51171875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 2.0, 6.0, 9.0, 17.0, 16.0, 26.0, 41.0, 57.0, 79.0, 127.0, 159.0, 239.0, 370.0, 488.0, 743.0, 1033.0, 1481.0, 2274.0, 3211.0, 4737.0, 7046.0, 10712.0, 16083.0, 24886.0, 39599.0, 65393.0, 116554.0, 295462.0, 205480.0, 96353.0, 56093.0, 34470.0, 21766.0, 14362.0, 9473.0, 6231.0, 4260.0, 2826.0, 1995.0, 1339.0, 950.0, 677.0, 439.0, 299.0, 197.0, 152.0, 111.0, 71.0, 61.0, 33.0, 28.0, 14.0, 13.0, 5.0, 5.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.255615234375, -0.2473297119140625, -0.239044189453125, -0.2307586669921875, -0.22247314453125, -0.2141876220703125, -0.205902099609375, -0.1976165771484375, -0.1893310546875, -0.1810455322265625, -0.172760009765625, -0.1644744873046875, -0.15618896484375, -0.1479034423828125, -0.139617919921875, -0.1313323974609375, -0.123046875, -0.1147613525390625, -0.106475830078125, -0.0981903076171875, -0.08990478515625, -0.0816192626953125, -0.073333740234375, -0.0650482177734375, -0.0567626953125, -0.0484771728515625, -0.040191650390625, -0.0319061279296875, -0.02362060546875, -0.0153350830078125, -0.007049560546875, 0.0012359619140625, 0.009521484375, 0.0178070068359375, 0.026092529296875, 0.0343780517578125, 0.04266357421875, 0.0509490966796875, 0.059234619140625, 0.0675201416015625, 0.0758056640625, 0.0840911865234375, 0.092376708984375, 0.1006622314453125, 0.10894775390625, 0.1172332763671875, 0.125518798828125, 0.1338043212890625, 0.14208984375, 0.1503753662109375, 0.158660888671875, 0.1669464111328125, 0.17523193359375, 0.1835174560546875, 0.191802978515625, 0.2000885009765625, 0.2083740234375, 0.2166595458984375, 0.224945068359375, 0.2332305908203125, 0.24151611328125, 0.2498016357421875, 0.258087158203125, 0.2663726806640625, 0.274658203125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 11.0, 5.0, 8.0, 7.0, 13.0, 12.0, 16.0, 18.0, 17.0, 22.0, 17.0, 26.0, 38.0, 22.0, 31.0, 35.0, 31.0, 33.0, 40.0, 43.0, 1074.0, 40.0, 55.0, 47.0, 34.0, 33.0, 29.0, 41.0, 26.0, 24.0, 28.0, 22.0, 26.0, 14.0, 13.0, 8.0, 18.0, 13.0, 9.0, 10.0, 8.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.181640625, -2.10357666015625, -2.0255126953125, -1.94744873046875, -1.869384765625, -1.79132080078125, -1.7132568359375, -1.63519287109375, -1.55712890625, -1.47906494140625, -1.4010009765625, -1.32293701171875, -1.244873046875, -1.16680908203125, -1.0887451171875, -1.01068115234375, -0.9326171875, -0.85455322265625, -0.7764892578125, -0.69842529296875, -0.620361328125, -0.54229736328125, -0.4642333984375, -0.38616943359375, -0.30810546875, -0.23004150390625, -0.1519775390625, -0.07391357421875, 0.004150390625, 0.08221435546875, 0.1602783203125, 0.23834228515625, 0.31640625, 0.39447021484375, 0.4725341796875, 0.55059814453125, 0.628662109375, 0.70672607421875, 0.7847900390625, 0.86285400390625, 0.94091796875, 1.01898193359375, 1.0970458984375, 1.17510986328125, 1.253173828125, 1.33123779296875, 1.4093017578125, 1.48736572265625, 1.5654296875, 1.64349365234375, 1.7215576171875, 1.79962158203125, 1.877685546875, 1.95574951171875, 2.0338134765625, 2.11187744140625, 2.18994140625, 2.26800537109375, 2.3460693359375, 2.42413330078125, 2.502197265625, 2.58026123046875, 2.6583251953125, 2.73638916015625, 2.814453125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 9.0, 8.0, 16.0, 19.0, 36.0, 57.0, 75.0, 112.0, 173.0, 245.0, 422.0, 599.0, 945.0, 1446.0, 2241.0, 3482.0, 5517.0, 8806.0, 14260.0, 23905.0, 41816.0, 77125.0, 172529.0, 1450502.0, 135591.0, 65814.0, 36086.0, 20950.0, 12726.0, 7886.0, 4832.0, 3160.0, 2069.0, 1252.0, 838.0, 518.0, 395.0, 221.0, 158.0, 100.0, 63.0, 51.0, 27.0, 13.0, 12.0, 14.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.18896484375, -0.18346786499023438, -0.17797088623046875, -0.17247390747070312, -0.1669769287109375, -0.16147994995117188, -0.15598297119140625, -0.15048599243164062, -0.144989013671875, -0.13949203491210938, -0.13399505615234375, -0.12849807739257812, -0.1230010986328125, -0.11750411987304688, -0.11200714111328125, -0.10651016235351562, -0.10101318359375, -0.09551620483398438, -0.09001922607421875, -0.08452224731445312, -0.0790252685546875, -0.07352828979492188, -0.06803131103515625, -0.06253433227539062, -0.057037353515625, -0.051540374755859375, -0.04604339599609375, -0.040546417236328125, -0.0350494384765625, -0.029552459716796875, -0.02405548095703125, -0.018558502197265625, -0.0130615234375, -0.007564544677734375, -0.00206756591796875, 0.003429412841796875, 0.0089263916015625, 0.014423370361328125, 0.01992034912109375, 0.025417327880859375, 0.030914306640625, 0.036411285400390625, 0.04190826416015625, 0.047405242919921875, 0.0529022216796875, 0.058399200439453125, 0.06389617919921875, 0.06939315795898438, 0.07489013671875, 0.08038711547851562, 0.08588409423828125, 0.09138107299804688, 0.0968780517578125, 0.10237503051757812, 0.10787200927734375, 0.11336898803710938, 0.118865966796875, 0.12436294555664062, 0.12985992431640625, 0.13535690307617188, 0.1408538818359375, 0.14635086059570312, 0.15184783935546875, 0.15734481811523438, 0.162841796875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 3.0, 10.0, 8.0, 11.0, 11.0, 22.0, 22.0, 28.0, 38.0, 43.0, 77.0, 95.0, 136.0, 141.0, 100.0, 67.0, 43.0, 24.0, 22.0, 28.0, 14.0, 8.0, 7.0, 7.0, 6.0, 5.0, 4.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4126300811767578e-05, -1.3532117009162903e-05, -1.2937933206558228e-05, -1.2343749403953552e-05, -1.1749565601348877e-05, -1.1155381798744202e-05, -1.0561197996139526e-05, -9.967014193534851e-06, -9.372830390930176e-06, -8.7786465883255e-06, -8.184462785720825e-06, -7.59027898311615e-06, -6.996095180511475e-06, -6.401911377906799e-06, -5.807727575302124e-06, -5.213543772697449e-06, -4.6193599700927734e-06, -4.025176167488098e-06, -3.430992364883423e-06, -2.8368085622787476e-06, -2.2426247596740723e-06, -1.648440957069397e-06, -1.0542571544647217e-06, -4.600733518600464e-07, 1.341104507446289e-07, 7.282942533493042e-07, 1.3224780559539795e-06, 1.9166618585586548e-06, 2.51084566116333e-06, 3.1050294637680054e-06, 3.6992132663726807e-06, 4.293397068977356e-06, 4.887580871582031e-06, 5.4817646741867065e-06, 6.075948476791382e-06, 6.670132279396057e-06, 7.264316082000732e-06, 7.858499884605408e-06, 8.452683687210083e-06, 9.046867489814758e-06, 9.641051292419434e-06, 1.0235235095024109e-05, 1.0829418897628784e-05, 1.142360270023346e-05, 1.2017786502838135e-05, 1.261197030544281e-05, 1.3206154108047485e-05, 1.380033791065216e-05, 1.4394521713256836e-05, 1.4988705515861511e-05, 1.5582889318466187e-05, 1.6177073121070862e-05, 1.6771256923675537e-05, 1.7365440726280212e-05, 1.7959624528884888e-05, 1.8553808331489563e-05, 1.9147992134094238e-05, 1.9742175936698914e-05, 2.033635973930359e-05, 2.0930543541908264e-05, 2.152472734451294e-05, 2.2118911147117615e-05, 2.271309494972229e-05, 2.3307278752326965e-05, 2.390146255493164e-05]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 4.0, 6.0, 14.0, 10.0, 15.0, 24.0, 35.0, 45.0, 71.0, 232.0, 1177.0, 16324.0, 825630.0, 197919.0, 5977.0, 645.0, 186.0, 80.0, 47.0, 23.0, 16.0, 15.0, 7.0, 11.0, 9.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0003914833068847656, -0.0003808550536632538, -0.00037022680044174194, -0.0003595985472202301, -0.00034897029399871826, -0.0003383420407772064, -0.0003277137875556946, -0.00031708553433418274, -0.0003064572811126709, -0.00029582902789115906, -0.0002852007746696472, -0.0002745725214481354, -0.00026394426822662354, -0.0002533160150051117, -0.00024268776178359985, -0.000232059508562088, -0.00022143125534057617, -0.00021080300211906433, -0.0002001747488975525, -0.00018954649567604065, -0.0001789182424545288, -0.00016828998923301697, -0.00015766173601150513, -0.00014703348278999329, -0.00013640522956848145, -0.0001257769763469696, -0.00011514872312545776, -0.00010452046990394592, -9.389221668243408e-05, -8.326396346092224e-05, -7.26357102394104e-05, -6.200745701789856e-05, -5.137920379638672e-05, -4.075095057487488e-05, -3.0122697353363037e-05, -1.9494444131851196e-05, -8.866190910339355e-06, 1.7620623111724854e-06, 1.2390315532684326e-05, 2.3018568754196167e-05, 3.364682197570801e-05, 4.427507519721985e-05, 5.490332841873169e-05, 6.553158164024353e-05, 7.615983486175537e-05, 8.678808808326721e-05, 9.741634130477905e-05, 0.0001080445945262909, 0.00011867284774780273, 0.00012930110096931458, 0.00013992935419082642, 0.00015055760741233826, 0.0001611858606338501, 0.00017181411385536194, 0.00018244236707687378, 0.00019307062029838562, 0.00020369887351989746, 0.0002143271267414093, 0.00022495537996292114, 0.00023558363318443298, 0.0002462118864059448, 0.00025684013962745667, 0.0002674683928489685, 0.00027809664607048035, 0.0002887248992919922]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 8.0, 16.0, 43.0, 117.0, 178.0, 266.0, 221.0, 96.0, 41.0, 19.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.423531193722738e-05, -1.3010080692765769e-05, -1.178485035779886e-05, -1.0559619113337249e-05, -9.334387868875638e-06, -8.109157533908729e-06, -6.883926289447118e-06, -5.6586959544802085e-06, -4.4334647100185975e-06, -3.2082339203043375e-06, -1.983002903216402e-06, -7.577718861284666e-07, 4.6745890358579345e-07, 1.6926896933000535e-06, 2.9179209377616644e-06, 4.1431512727285735e-06, 5.3683825171901844e-06, 6.5936133069044445e-06, 7.818844096618704e-06, 9.044075341080315e-06, 1.0269306585541926e-05, 1.1494536920508835e-05, 1.2719768164970446e-05, 1.3944998499937356e-05, 1.5170229744398966e-05, 1.6395460988860577e-05, 1.7620692233322188e-05, 1.88459234777838e-05, 2.0071152903256007e-05, 2.1296384147717617e-05, 2.252161539217923e-05, 2.3746844817651436e-05, 2.4972079700091854e-05, 2.6197310944553465e-05, 2.7422542189015076e-05, 2.8647773433476686e-05, 2.9873002858948894e-05, 3.109823592239991e-05, 3.232346352888271e-05, 3.354869477334432e-05, 3.4773926017805934e-05, 3.5999157262267545e-05, 3.7224388506729156e-05, 3.844961975119077e-05, 3.967485099565238e-05, 4.090007860213518e-05, 4.21253134845756e-05, 4.33505410910584e-05, 4.457577597349882e-05, 4.580100721796043e-05, 4.702623846242204e-05, 4.8251469706883654e-05, 4.9476700951345265e-05, 5.070192855782807e-05, 5.192716344026849e-05, 5.315239104675129e-05, 5.43776222912129e-05, 5.560285353567451e-05, 5.682808478013612e-05, 5.8053316024597734e-05, 5.9278547269059345e-05, 6.0503778513520956e-05, 6.172900612000376e-05, 6.295424100244418e-05, 6.417946860892698e-05]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 5.0, 9.0, 7.0, 16.0, 18.0, 16.0, 17.0, 28.0, 14.0, 33.0, 30.0, 18.0, 24.0, 39.0, 27.0, 49.0, 22.0, 39.0, 43.0, 34.0, 45.0, 45.0, 37.0, 45.0, 47.0, 21.0, 27.0, 38.0, 24.0, 28.0, 34.0, 16.0, 15.0, 21.0, 13.0, 13.0, 6.0, 8.0, 7.0, 8.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.569789886474609e-06, -7.351860404014587e-06, -7.1339309215545654e-06, -6.9160014390945435e-06, -6.6980719566345215e-06, -6.4801424741744995e-06, -6.2622129917144775e-06, -6.0442835092544556e-06, -5.826354026794434e-06, -5.608424544334412e-06, -5.39049506187439e-06, -5.172565579414368e-06, -4.954636096954346e-06, -4.736706614494324e-06, -4.518777132034302e-06, -4.30084764957428e-06, -4.082918167114258e-06, -3.864988684654236e-06, -3.647059202194214e-06, -3.429129719734192e-06, -3.21120023727417e-06, -2.993270754814148e-06, -2.775341272354126e-06, -2.557411789894104e-06, -2.339482307434082e-06, -2.12155282497406e-06, -1.903623342514038e-06, -1.6856938600540161e-06, -1.4677643775939941e-06, -1.2498348951339722e-06, -1.0319054126739502e-06, -8.139759302139282e-07, -5.960464477539062e-07, -3.781169652938843e-07, -1.601874828338623e-07, 5.774199962615967e-08, 2.7567148208618164e-07, 4.936009645462036e-07, 7.115304470062256e-07, 9.294599294662476e-07, 1.1473894119262695e-06, 1.3653188943862915e-06, 1.5832483768463135e-06, 1.8011778593063354e-06, 2.0191073417663574e-06, 2.2370368242263794e-06, 2.4549663066864014e-06, 2.6728957891464233e-06, 2.8908252716064453e-06, 3.1087547540664673e-06, 3.3266842365264893e-06, 3.5446137189865112e-06, 3.762543201446533e-06, 3.980472683906555e-06, 4.198402166366577e-06, 4.416331648826599e-06, 4.634261131286621e-06, 4.852190613746643e-06, 5.070120096206665e-06, 5.288049578666687e-06, 5.505979061126709e-06, 5.723908543586731e-06, 5.941838026046753e-06, 6.159767508506775e-06, 6.377696990966797e-06]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 4.0, 6.0, 11.0, 6.0, 9.0, 13.0, 10.0, 21.0, 24.0, 20.0, 32.0, 28.0, 35.0, 41.0, 44.0, 35.0, 51.0, 44.0, 36.0, 42.0, 46.0, 40.0, 34.0, 32.0, 34.0, 44.0, 26.0, 35.0, 18.0, 28.0, 27.0, 19.0, 20.0, 16.0, 8.0, 14.0, 8.0, 4.0, 7.0, 4.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.900390625, -3.784576416015625, -3.66876220703125, -3.552947998046875, -3.4371337890625, -3.321319580078125, -3.20550537109375, -3.089691162109375, -2.973876953125, -2.858062744140625, -2.74224853515625, -2.626434326171875, -2.5106201171875, -2.394805908203125, -2.27899169921875, -2.163177490234375, -2.04736328125, -1.931549072265625, -1.81573486328125, -1.699920654296875, -1.5841064453125, -1.468292236328125, -1.35247802734375, -1.236663818359375, -1.120849609375, -1.005035400390625, -0.88922119140625, -0.773406982421875, -0.6575927734375, -0.541778564453125, -0.42596435546875, -0.310150146484375, -0.1943359375, -0.078521728515625, 0.03729248046875, 0.153106689453125, 0.2689208984375, 0.384735107421875, 0.50054931640625, 0.616363525390625, 0.732177734375, 0.847991943359375, 0.96380615234375, 1.079620361328125, 1.1954345703125, 1.311248779296875, 1.42706298828125, 1.542877197265625, 1.65869140625, 1.774505615234375, 1.89031982421875, 2.006134033203125, 2.1219482421875, 2.237762451171875, 2.35357666015625, 2.469390869140625, 2.585205078125, 2.701019287109375, 2.81683349609375, 2.932647705078125, 3.0484619140625, 3.164276123046875, 3.28009033203125, 3.395904541015625, 3.51171875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 17.0, 14.0, 20.0, 34.0, 42.0, 61.0, 95.0, 145.0, 202.0, 336.0, 524.0, 894.0, 1450.0, 2557.0, 4250.0, 7498.0, 13349.0, 24121.0, 44254.0, 85108.0, 171769.0, 304380.0, 187018.0, 92543.0, 48166.0, 25895.0, 14435.0, 7918.0, 4520.0, 2714.0, 1512.0, 947.0, 636.0, 355.0, 248.0, 187.0, 110.0, 69.0, 40.0, 39.0, 26.0, 25.0, 8.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.392578125, -3.28839111328125, -3.1842041015625, -3.08001708984375, -2.975830078125, -2.87164306640625, -2.7674560546875, -2.66326904296875, -2.55908203125, -2.45489501953125, -2.3507080078125, -2.24652099609375, -2.142333984375, -2.03814697265625, -1.9339599609375, -1.82977294921875, -1.7255859375, -1.62139892578125, -1.5172119140625, -1.41302490234375, -1.308837890625, -1.20465087890625, -1.1004638671875, -0.99627685546875, -0.89208984375, -0.78790283203125, -0.6837158203125, -0.57952880859375, -0.475341796875, -0.37115478515625, -0.2669677734375, -0.16278076171875, -0.05859375, 0.04559326171875, 0.1497802734375, 0.25396728515625, 0.358154296875, 0.46234130859375, 0.5665283203125, 0.67071533203125, 0.77490234375, 0.87908935546875, 0.9832763671875, 1.08746337890625, 1.191650390625, 1.29583740234375, 1.4000244140625, 1.50421142578125, 1.6083984375, 1.71258544921875, 1.8167724609375, 1.92095947265625, 2.025146484375, 2.12933349609375, 2.2335205078125, 2.33770751953125, 2.44189453125, 2.54608154296875, 2.6502685546875, 2.75445556640625, 2.858642578125, 2.96282958984375, 3.0670166015625, 3.17120361328125, 3.275390625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 6.0, 11.0, 7.0, 14.0, 23.0, 18.0, 28.0, 23.0, 28.0, 28.0, 28.0, 37.0, 55.0, 49.0, 59.0, 110.0, 328.0, 1630.0, 144.0, 57.0, 51.0, 49.0, 30.0, 40.0, 25.0, 28.0, 22.0, 21.0, 15.0, 16.0, 19.0, 9.0, 11.0, 4.0, 4.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.2109375, -14.8126220703125, -14.414306640625, -14.0159912109375, -13.61767578125, -13.2193603515625, -12.821044921875, -12.4227294921875, -12.0244140625, -11.6260986328125, -11.227783203125, -10.8294677734375, -10.43115234375, -10.0328369140625, -9.634521484375, -9.2362060546875, -8.837890625, -8.4395751953125, -8.041259765625, -7.6429443359375, -7.24462890625, -6.8463134765625, -6.447998046875, -6.0496826171875, -5.6513671875, -5.2530517578125, -4.854736328125, -4.4564208984375, -4.05810546875, -3.6597900390625, -3.261474609375, -2.8631591796875, -2.46484375, -2.0665283203125, -1.668212890625, -1.2698974609375, -0.87158203125, -0.4732666015625, -0.074951171875, 0.3233642578125, 0.7216796875, 1.1199951171875, 1.518310546875, 1.9166259765625, 2.31494140625, 2.7132568359375, 3.111572265625, 3.5098876953125, 3.908203125, 4.3065185546875, 4.704833984375, 5.1031494140625, 5.50146484375, 5.8997802734375, 6.298095703125, 6.6964111328125, 7.0947265625, 7.4930419921875, 7.891357421875, 8.2896728515625, 8.68798828125, 9.0863037109375, 9.484619140625, 9.8829345703125, 10.28125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 6.0, 6.0, 3.0, 1.0, 9.0, 10.0, 9.0, 21.0, 19.0, 24.0, 32.0, 35.0, 75.0, 67.0, 99.0, 109.0, 176.0, 302.0, 449.0, 1698.0, 33660.0, 2880507.0, 221422.0, 5074.0, 717.0, 330.0, 212.0, 147.0, 108.0, 82.0, 71.0, 49.0, 40.0, 39.0, 25.0, 20.0, 20.0, 9.0, 7.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.703125, -17.04052734375, -16.3779296875, -15.71533203125, -15.052734375, -14.39013671875, -13.7275390625, -13.06494140625, -12.40234375, -11.73974609375, -11.0771484375, -10.41455078125, -9.751953125, -9.08935546875, -8.4267578125, -7.76416015625, -7.1015625, -6.43896484375, -5.7763671875, -5.11376953125, -4.451171875, -3.78857421875, -3.1259765625, -2.46337890625, -1.80078125, -1.13818359375, -0.4755859375, 0.18701171875, 0.849609375, 1.51220703125, 2.1748046875, 2.83740234375, 3.5, 4.16259765625, 4.8251953125, 5.48779296875, 6.150390625, 6.81298828125, 7.4755859375, 8.13818359375, 8.80078125, 9.46337890625, 10.1259765625, 10.78857421875, 11.451171875, 12.11376953125, 12.7763671875, 13.43896484375, 14.1015625, 14.76416015625, 15.4267578125, 16.08935546875, 16.751953125, 17.41455078125, 18.0771484375, 18.73974609375, 19.40234375, 20.06494140625, 20.7275390625, 21.39013671875, 22.052734375, 22.71533203125, 23.3779296875, 24.04052734375, 24.703125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [5.0, 20.0, 89.0, 257.0, 360.0, 190.0, 75.0, 21.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6989922523498535, -5.203291416168213, -3.707590341567993, -2.2118892669677734, -0.7161884307861328, 0.7795124053955078, 2.2752137184143066, 3.7709145545959473, 5.266615390777588, 6.7623162269592285, 8.258017539978027, 9.753718376159668, 11.249419212341309, 12.74512004852295, 14.240821838378906, 15.736522674560547, 17.232223510742188, 18.727924346923828, 20.22362518310547, 21.71932601928711, 23.21502685546875, 24.71072769165039, 26.20642852783203, 27.702129364013672, 29.197830200195312, 30.693531036376953, 32.189231872558594, 33.684932708740234, 35.180633544921875, 36.676334381103516, 38.172035217285156, 39.6677360534668, 41.1634407043457, 42.659141540527344, 44.154842376708984, 45.650543212890625, 47.146244049072266, 48.641944885253906, 50.13764572143555, 51.63334655761719, 53.12904739379883, 54.62474822998047, 56.12044906616211, 57.61614990234375, 59.11185073852539, 60.60755157470703, 62.10325241088867, 63.59895324707031, 65.09465789794922, 66.59036254882812, 68.0860595703125, 69.5817642211914, 71.07746124267578, 72.57316589355469, 74.06886291503906, 75.56456756591797, 77.06026458740234, 78.55596923828125, 80.05166625976562, 81.54737091064453, 83.0430679321289, 84.53877258300781, 86.03446960449219, 87.5301742553711, 89.02587127685547]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 10.0, 6.0, 15.0, 7.0, 10.0, 14.0, 30.0, 13.0, 27.0, 29.0, 25.0, 24.0, 39.0, 22.0, 35.0, 51.0, 38.0, 55.0, 41.0, 50.0, 46.0, 44.0, 42.0, 30.0, 42.0, 38.0, 33.0, 29.0, 23.0, 18.0, 17.0, 11.0, 19.0, 10.0, 12.0, 5.0, 6.0, 9.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.839984893798828, -28.81067657470703, -27.781370162963867, -26.75206184387207, -25.722755432128906, -24.69344711303711, -23.664138793945312, -22.634830474853516, -21.60552406311035, -20.576215744018555, -19.54690933227539, -18.517601013183594, -17.488292694091797, -16.458986282348633, -15.429677963256836, -14.400370597839355, -13.371063232421875, -12.341755867004395, -11.312448501586914, -10.283140182495117, -9.253832817077637, -8.224525451660156, -7.195217609405518, -6.165909767150879, -5.136602401733398, -4.107295036315918, -3.0779871940612793, -2.0486795902252197, -1.0193719863891602, 0.009935379028320312, 1.039243221282959, 2.0685510635375977, 3.0978622436523438, 4.127169609069824, 5.156477451324463, 6.185785293579102, 7.215092658996582, 8.244400024414062, 9.27370834350586, 10.30301570892334, 11.33232307434082, 12.3616304397583, 13.390937805175781, 14.420246124267578, 15.449553489685059, 16.47886085510254, 17.508169174194336, 18.5374755859375, 19.566783905029297, 20.596092224121094, 21.625398635864258, 22.654706954956055, 23.68401336669922, 24.713321685791016, 25.742630004882812, 26.77193832397461, 27.801244735717773, 28.83055305480957, 29.859859466552734, 30.88916778564453, 31.918476104736328, 32.947784423828125, 33.977088928222656, 35.00639724731445, 36.03570556640625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 1.0, 6.0, 9.0, 11.0, 9.0, 12.0, 13.0, 14.0, 23.0, 28.0, 23.0, 33.0, 32.0, 35.0, 43.0, 45.0, 45.0, 38.0, 42.0, 43.0, 44.0, 34.0, 33.0, 33.0, 34.0, 53.0, 27.0, 32.0, 20.0, 20.0, 25.0, 20.0, 20.0, 20.0, 12.0, 14.0, 7.0, 9.0, 4.0, 7.0, 6.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.1015625, -3.984100341796875, -3.86663818359375, -3.749176025390625, -3.6317138671875, -3.514251708984375, -3.39678955078125, -3.279327392578125, -3.161865234375, -3.044403076171875, -2.92694091796875, -2.809478759765625, -2.6920166015625, -2.574554443359375, -2.45709228515625, -2.339630126953125, -2.22216796875, -2.104705810546875, -1.98724365234375, -1.869781494140625, -1.7523193359375, -1.634857177734375, -1.51739501953125, -1.399932861328125, -1.282470703125, -1.165008544921875, -1.04754638671875, -0.930084228515625, -0.8126220703125, -0.695159912109375, -0.57769775390625, -0.460235595703125, -0.3427734375, -0.225311279296875, -0.10784912109375, 0.009613037109375, 0.1270751953125, 0.244537353515625, 0.36199951171875, 0.479461669921875, 0.596923828125, 0.714385986328125, 0.83184814453125, 0.949310302734375, 1.0667724609375, 1.184234619140625, 1.30169677734375, 1.419158935546875, 1.53662109375, 1.654083251953125, 1.77154541015625, 1.889007568359375, 2.0064697265625, 2.123931884765625, 2.24139404296875, 2.358856201171875, 2.476318359375, 2.593780517578125, 2.71124267578125, 2.828704833984375, 2.9461669921875, 3.063629150390625, 3.18109130859375, 3.298553466796875, 3.416015625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 13.0, 13.0, 25.0, 33.0, 37.0, 47.0, 68.0, 127.0, 172.0, 264.0, 462.0, 823.0, 1758.0, 3926.0, 9843.0, 29423.0, 110226.0, 643879.0, 2594711.0, 640191.0, 111120.0, 29665.0, 9908.0, 3860.0, 1724.0, 775.0, 433.0, 258.0, 134.0, 122.0, 78.0, 50.0, 19.0, 21.0, 16.0, 17.0, 10.0, 6.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4921875, -8.24603271484375, -7.9998779296875, -7.75372314453125, -7.507568359375, -7.26141357421875, -7.0152587890625, -6.76910400390625, -6.52294921875, -6.27679443359375, -6.0306396484375, -5.78448486328125, -5.538330078125, -5.29217529296875, -5.0460205078125, -4.79986572265625, -4.5537109375, -4.30755615234375, -4.0614013671875, -3.81524658203125, -3.569091796875, -3.32293701171875, -3.0767822265625, -2.83062744140625, -2.58447265625, -2.33831787109375, -2.0921630859375, -1.84600830078125, -1.599853515625, -1.35369873046875, -1.1075439453125, -0.86138916015625, -0.615234375, -0.36907958984375, -0.1229248046875, 0.12322998046875, 0.369384765625, 0.61553955078125, 0.8616943359375, 1.10784912109375, 1.35400390625, 1.60015869140625, 1.8463134765625, 2.09246826171875, 2.338623046875, 2.58477783203125, 2.8309326171875, 3.07708740234375, 3.3232421875, 3.56939697265625, 3.8155517578125, 4.06170654296875, 4.307861328125, 4.55401611328125, 4.8001708984375, 5.04632568359375, 5.29248046875, 5.53863525390625, 5.7847900390625, 6.03094482421875, 6.277099609375, 6.52325439453125, 6.7694091796875, 7.01556396484375, 7.26171875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 2.0, 7.0, 2.0, 5.0, 5.0, 12.0, 15.0, 15.0, 28.0, 32.0, 28.0, 37.0, 65.0, 69.0, 90.0, 139.0, 202.0, 225.0, 310.0, 391.0, 505.0, 493.0, 324.0, 278.0, 180.0, 149.0, 95.0, 79.0, 66.0, 53.0, 32.0, 32.0, 29.0, 28.0, 14.0, 18.0, 9.0, 10.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.72265625, -4.54583740234375, -4.3690185546875, -4.19219970703125, -4.015380859375, -3.83856201171875, -3.6617431640625, -3.48492431640625, -3.30810546875, -3.13128662109375, -2.9544677734375, -2.77764892578125, -2.600830078125, -2.42401123046875, -2.2471923828125, -2.07037353515625, -1.8935546875, -1.71673583984375, -1.5399169921875, -1.36309814453125, -1.186279296875, -1.00946044921875, -0.8326416015625, -0.65582275390625, -0.47900390625, -0.30218505859375, -0.1253662109375, 0.05145263671875, 0.228271484375, 0.40509033203125, 0.5819091796875, 0.75872802734375, 0.935546875, 1.11236572265625, 1.2891845703125, 1.46600341796875, 1.642822265625, 1.81964111328125, 1.9964599609375, 2.17327880859375, 2.35009765625, 2.52691650390625, 2.7037353515625, 2.88055419921875, 3.057373046875, 3.23419189453125, 3.4110107421875, 3.58782958984375, 3.7646484375, 3.94146728515625, 4.1182861328125, 4.29510498046875, 4.471923828125, 4.64874267578125, 4.8255615234375, 5.00238037109375, 5.17919921875, 5.35601806640625, 5.5328369140625, 5.70965576171875, 5.886474609375, 6.06329345703125, 6.2401123046875, 6.41693115234375, 6.59375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 9.0, 6.0, 6.0, 19.0, 21.0, 31.0, 32.0, 35.0, 43.0, 71.0, 95.0, 106.0, 164.0, 234.0, 426.0, 1743.0, 19755.0, 882392.0, 3230888.0, 53228.0, 3345.0, 598.0, 313.0, 211.0, 143.0, 90.0, 63.0, 54.0, 42.0, 28.0, 32.0, 9.0, 11.0, 14.0, 8.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-34.4375, -33.534912109375, -32.63232421875, -31.729736328125, -30.8271484375, -29.924560546875, -29.02197265625, -28.119384765625, -27.216796875, -26.314208984375, -25.41162109375, -24.509033203125, -23.6064453125, -22.703857421875, -21.80126953125, -20.898681640625, -19.99609375, -19.093505859375, -18.19091796875, -17.288330078125, -16.3857421875, -15.483154296875, -14.58056640625, -13.677978515625, -12.775390625, -11.872802734375, -10.97021484375, -10.067626953125, -9.1650390625, -8.262451171875, -7.35986328125, -6.457275390625, -5.5546875, -4.652099609375, -3.74951171875, -2.846923828125, -1.9443359375, -1.041748046875, -0.13916015625, 0.763427734375, 1.666015625, 2.568603515625, 3.47119140625, 4.373779296875, 5.2763671875, 6.178955078125, 7.08154296875, 7.984130859375, 8.88671875, 9.789306640625, 10.69189453125, 11.594482421875, 12.4970703125, 13.399658203125, 14.30224609375, 15.204833984375, 16.107421875, 17.010009765625, 17.91259765625, 18.815185546875, 19.7177734375, 20.620361328125, 21.52294921875, 22.425537109375, 23.328125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 11.0, 9.0, 20.0, 24.0, 30.0, 39.0, 45.0, 52.0, 59.0, 67.0, 85.0, 83.0, 70.0, 63.0, 62.0, 64.0, 50.0, 39.0, 35.0, 23.0, 19.0, 14.0, 12.0, 8.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.238107681274414, -30.47184944152832, -29.705591201782227, -28.9393310546875, -28.173072814941406, -27.406814575195312, -26.64055633544922, -25.874298095703125, -25.10803985595703, -24.341781616210938, -23.575523376464844, -22.80926513671875, -22.043004989624023, -21.27674674987793, -20.510488510131836, -19.744230270385742, -18.977970123291016, -18.211711883544922, -17.445453643798828, -16.679195404052734, -15.912935256958008, -15.146677017211914, -14.38041877746582, -13.614160537719727, -12.847901344299316, -12.081643104553223, -11.315383911132812, -10.549125671386719, -9.782867431640625, -9.016608238220215, -8.250349998474121, -7.484091281890869, -6.717830657958984, -5.951571941375732, -5.1853132247924805, -4.419054985046387, -3.6527962684631348, -2.886537551879883, -2.120279312133789, -1.354020595550537, -0.5877618789672852, 0.17849671840667725, 0.9447553157806396, 1.7110137939453125, 2.4772725105285645, 3.2435312271118164, 4.00978946685791, 4.776048183441162, 5.542306900024414, 6.308565616607666, 7.074824333190918, 7.841082572937012, 8.607341766357422, 9.373600006103516, 10.13985824584961, 10.906116485595703, 11.672375679016113, 12.438633918762207, 13.204893112182617, 13.971151351928711, 14.737409591674805, 15.503668785095215, 16.269927978515625, 17.03618621826172, 17.802444458007812]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 8.0, 13.0, 9.0, 9.0, 17.0, 12.0, 9.0, 17.0, 17.0, 27.0, 35.0, 26.0, 35.0, 43.0, 37.0, 43.0, 36.0, 41.0, 46.0, 37.0, 41.0, 50.0, 44.0, 47.0, 36.0, 24.0, 31.0, 28.0, 35.0, 21.0, 15.0, 21.0, 24.0, 16.0, 11.0, 11.0, 7.0, 4.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.270782470703125, -20.618101119995117, -19.965421676635742, -19.312740325927734, -18.66006088256836, -18.00737953186035, -17.354700088500977, -16.70201873779297, -16.049339294433594, -15.396658897399902, -14.743978500366211, -14.09129810333252, -13.438617706298828, -12.78593635559082, -12.133255958557129, -11.480575561523438, -10.82789421081543, -10.175213813781738, -9.522533416748047, -8.869853019714355, -8.217172622680664, -7.5644917488098145, -6.911810874938965, -6.259130477905273, -5.606450080871582, -4.953769683837891, -4.301089286804199, -3.6484084129333496, -2.995728015899658, -2.343047618865967, -1.6903669834136963, -1.0376863479614258, -0.3850059509277344, 0.2676745653152466, 0.9203550815582275, 1.5730355978012085, 2.2257161140441895, 2.878396511077881, 3.5310771465301514, 4.183757781982422, 4.836438179016113, 5.489118576049805, 6.141798973083496, 6.794479846954346, 7.447160243988037, 8.09984016418457, 8.752521514892578, 9.40520191192627, 10.057882308959961, 10.710562705993652, 11.363243103027344, 12.015923500061035, 12.668603897094727, 13.321285247802734, 13.973965644836426, 14.626646041870117, 15.279326438903809, 15.9320068359375, 16.584688186645508, 17.237367630004883, 17.89004898071289, 18.542728424072266, 19.195409774780273, 19.84809112548828, 20.500770568847656]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 6.0, 9.0, 8.0, 18.0, 20.0, 11.0, 15.0, 19.0, 32.0, 24.0, 30.0, 36.0, 55.0, 35.0, 40.0, 37.0, 43.0, 40.0, 39.0, 45.0, 34.0, 46.0, 36.0, 39.0, 26.0, 38.0, 34.0, 24.0, 27.0, 17.0, 21.0, 16.0, 14.0, 6.0, 8.0, 5.0, 10.0, 10.0, 3.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01171875, -3.891265869140625, -3.77081298828125, -3.650360107421875, -3.5299072265625, -3.409454345703125, -3.28900146484375, -3.168548583984375, -3.048095703125, -2.927642822265625, -2.80718994140625, -2.686737060546875, -2.5662841796875, -2.445831298828125, -2.32537841796875, -2.204925537109375, -2.08447265625, -1.964019775390625, -1.84356689453125, -1.723114013671875, -1.6026611328125, -1.482208251953125, -1.36175537109375, -1.241302490234375, -1.120849609375, -1.000396728515625, -0.87994384765625, -0.759490966796875, -0.6390380859375, -0.518585205078125, -0.39813232421875, -0.277679443359375, -0.1572265625, -0.036773681640625, 0.08367919921875, 0.204132080078125, 0.3245849609375, 0.445037841796875, 0.56549072265625, 0.685943603515625, 0.806396484375, 0.926849365234375, 1.04730224609375, 1.167755126953125, 1.2882080078125, 1.408660888671875, 1.52911376953125, 1.649566650390625, 1.77001953125, 1.890472412109375, 2.01092529296875, 2.131378173828125, 2.2518310546875, 2.372283935546875, 2.49273681640625, 2.613189697265625, 2.733642578125, 2.854095458984375, 2.97454833984375, 3.095001220703125, 3.2154541015625, 3.335906982421875, 3.45635986328125, 3.576812744140625, 3.697265625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 8.0, 9.0, 11.0, 20.0, 27.0, 39.0, 61.0, 89.0, 124.0, 159.0, 229.0, 327.0, 469.0, 679.0, 1091.0, 1519.0, 2326.0, 3259.0, 4877.0, 7304.0, 11235.0, 17707.0, 27862.0, 46023.0, 78465.0, 144342.0, 325031.0, 157492.0, 84751.0, 49164.0, 29797.0, 18434.0, 11830.0, 7904.0, 5129.0, 3295.0, 2346.0, 1523.0, 1082.0, 780.0, 558.0, 378.0, 253.0, 186.0, 131.0, 82.0, 51.0, 36.0, 25.0, 12.0, 13.0, 9.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.27490234375, -0.26590728759765625, -0.2569122314453125, -0.24791717529296875, -0.238922119140625, -0.22992706298828125, -0.2209320068359375, -0.21193695068359375, -0.20294189453125, -0.19394683837890625, -0.1849517822265625, -0.17595672607421875, -0.166961669921875, -0.15796661376953125, -0.1489715576171875, -0.13997650146484375, -0.1309814453125, -0.12198638916015625, -0.1129913330078125, -0.10399627685546875, -0.095001220703125, -0.08600616455078125, -0.0770111083984375, -0.06801605224609375, -0.05902099609375, -0.05002593994140625, -0.0410308837890625, -0.03203582763671875, -0.023040771484375, -0.01404571533203125, -0.0050506591796875, 0.00394439697265625, 0.012939453125, 0.02193450927734375, 0.0309295654296875, 0.03992462158203125, 0.048919677734375, 0.05791473388671875, 0.0669097900390625, 0.07590484619140625, 0.08489990234375, 0.09389495849609375, 0.1028900146484375, 0.11188507080078125, 0.120880126953125, 0.12987518310546875, 0.1388702392578125, 0.14786529541015625, 0.1568603515625, 0.16585540771484375, 0.1748504638671875, 0.18384552001953125, 0.192840576171875, 0.20183563232421875, 0.2108306884765625, 0.21982574462890625, 0.22882080078125, 0.23781585693359375, 0.2468109130859375, 0.25580596923828125, 0.264801025390625, 0.27379608154296875, 0.2827911376953125, 0.29178619384765625, 0.30078125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 9.0, 8.0, 7.0, 8.0, 10.0, 19.0, 19.0, 20.0, 19.0, 12.0, 23.0, 26.0, 32.0, 26.0, 29.0, 41.0, 48.0, 36.0, 28.0, 51.0, 1060.0, 41.0, 42.0, 48.0, 45.0, 33.0, 25.0, 30.0, 23.0, 33.0, 23.0, 26.0, 20.0, 13.0, 12.0, 13.0, 15.0, 11.0, 8.0, 10.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.541015625, -2.462646484375, -2.38427734375, -2.305908203125, -2.2275390625, -2.149169921875, -2.07080078125, -1.992431640625, -1.9140625, -1.835693359375, -1.75732421875, -1.678955078125, -1.6005859375, -1.522216796875, -1.44384765625, -1.365478515625, -1.287109375, -1.208740234375, -1.13037109375, -1.052001953125, -0.9736328125, -0.895263671875, -0.81689453125, -0.738525390625, -0.66015625, -0.581787109375, -0.50341796875, -0.425048828125, -0.3466796875, -0.268310546875, -0.18994140625, -0.111572265625, -0.033203125, 0.045166015625, 0.12353515625, 0.201904296875, 0.2802734375, 0.358642578125, 0.43701171875, 0.515380859375, 0.59375, 0.672119140625, 0.75048828125, 0.828857421875, 0.9072265625, 0.985595703125, 1.06396484375, 1.142333984375, 1.220703125, 1.299072265625, 1.37744140625, 1.455810546875, 1.5341796875, 1.612548828125, 1.69091796875, 1.769287109375, 1.84765625, 1.926025390625, 2.00439453125, 2.082763671875, 2.1611328125, 2.239501953125, 2.31787109375, 2.396240234375, 2.474609375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 8.0, 7.0, 8.0, 18.0, 23.0, 25.0, 60.0, 74.0, 106.0, 167.0, 249.0, 293.0, 496.0, 745.0, 1139.0, 1642.0, 2375.0, 3711.0, 5780.0, 8704.0, 13739.0, 22051.0, 36592.0, 64655.0, 131603.0, 1417802.0, 185226.0, 82189.0, 44874.0, 26418.0, 16427.0, 10269.0, 6646.0, 4214.0, 2899.0, 1981.0, 1235.0, 850.0, 554.0, 437.0, 256.0, 189.0, 123.0, 79.0, 61.0, 55.0, 27.0, 17.0, 17.0, 3.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.165771484375, -0.1605396270751953, -0.15530776977539062, -0.15007591247558594, -0.14484405517578125, -0.13961219787597656, -0.13438034057617188, -0.1291484832763672, -0.1239166259765625, -0.11868476867675781, -0.11345291137695312, -0.10822105407714844, -0.10298919677734375, -0.09775733947753906, -0.09252548217773438, -0.08729362487792969, -0.082061767578125, -0.07682991027832031, -0.07159805297851562, -0.06636619567871094, -0.06113433837890625, -0.05590248107910156, -0.050670623779296875, -0.04543876647949219, -0.0402069091796875, -0.03497505187988281, -0.029743194580078125, -0.024511337280273438, -0.01927947998046875, -0.014047622680664062, -0.008815765380859375, -0.0035839080810546875, 0.00164794921875, 0.0068798065185546875, 0.012111663818359375, 0.017343521118164062, 0.02257537841796875, 0.027807235717773438, 0.033039093017578125, 0.03827095031738281, 0.0435028076171875, 0.04873466491699219, 0.053966522216796875, 0.05919837951660156, 0.06443023681640625, 0.06966209411621094, 0.07489395141601562, 0.08012580871582031, 0.085357666015625, 0.09058952331542969, 0.09582138061523438, 0.10105323791503906, 0.10628509521484375, 0.11151695251464844, 0.11674880981445312, 0.12198066711425781, 0.1272125244140625, 0.1324443817138672, 0.13767623901367188, 0.14290809631347656, 0.14813995361328125, 0.15337181091308594, 0.15860366821289062, 0.1638355255126953, 0.1690673828125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 4.0, 3.0, 5.0, 8.0, 5.0, 5.0, 11.0, 12.0, 19.0, 3.0, 11.0, 23.0, 21.0, 41.0, 27.0, 52.0, 46.0, 68.0, 90.0, 77.0, 85.0, 59.0, 67.0, 47.0, 30.0, 36.0, 19.0, 16.0, 14.0, 13.0, 19.0, 10.0, 11.0, 5.0, 6.0, 7.0, 9.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1563301086425781e-05, -1.122988760471344e-05, -1.0896474123001099e-05, -1.0563060641288757e-05, -1.0229647159576416e-05, -9.896233677864075e-06, -9.562820196151733e-06, -9.229406714439392e-06, -8.89599323272705e-06, -8.56257975101471e-06, -8.229166269302368e-06, -7.895752787590027e-06, -7.5623393058776855e-06, -7.228925824165344e-06, -6.895512342453003e-06, -6.562098860740662e-06, -6.22868537902832e-06, -5.895271897315979e-06, -5.561858415603638e-06, -5.228444933891296e-06, -4.895031452178955e-06, -4.561617970466614e-06, -4.2282044887542725e-06, -3.894791007041931e-06, -3.56137752532959e-06, -3.2279640436172485e-06, -2.8945505619049072e-06, -2.561137080192566e-06, -2.2277235984802246e-06, -1.8943101167678833e-06, -1.560896635055542e-06, -1.2274831533432007e-06, -8.940696716308594e-07, -5.606561899185181e-07, -2.2724270820617676e-07, 1.0617077350616455e-07, 4.3958425521850586e-07, 7.729977369308472e-07, 1.1064112186431885e-06, 1.4398247003555298e-06, 1.773238182067871e-06, 2.1066516637802124e-06, 2.4400651454925537e-06, 2.773478627204895e-06, 3.1068921089172363e-06, 3.4403055906295776e-06, 3.773719072341919e-06, 4.10713255405426e-06, 4.4405460357666016e-06, 4.773959517478943e-06, 5.107372999191284e-06, 5.4407864809036255e-06, 5.774199962615967e-06, 6.107613444328308e-06, 6.441026926040649e-06, 6.774440407752991e-06, 7.107853889465332e-06, 7.441267371177673e-06, 7.774680852890015e-06, 8.108094334602356e-06, 8.441507816314697e-06, 8.774921298027039e-06, 9.10833477973938e-06, 9.441748261451721e-06, 9.775161743164062e-06]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 6.0, 8.0, 9.0, 5.0, 13.0, 17.0, 21.0, 27.0, 32.0, 40.0, 70.0, 106.0, 321.0, 1409.0, 9660.0, 105208.0, 839320.0, 82051.0, 8402.0, 1201.0, 276.0, 100.0, 62.0, 34.0, 24.0, 23.0, 14.0, 13.0, 8.0, 8.0, 12.0, 7.0, 7.0, 6.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00020456314086914062, -0.0001978464424610138, -0.00019112974405288696, -0.00018441304564476013, -0.0001776963472366333, -0.00017097964882850647, -0.00016426295042037964, -0.0001575462520122528, -0.00015082955360412598, -0.00014411285519599915, -0.00013739615678787231, -0.00013067945837974548, -0.00012396275997161865, -0.00011724606156349182, -0.00011052936315536499, -0.00010381266474723816, -9.709596633911133e-05, -9.03792679309845e-05, -8.366256952285767e-05, -7.694587111473083e-05, -7.0229172706604e-05, -6.351247429847717e-05, -5.679577589035034e-05, -5.007907748222351e-05, -4.336237907409668e-05, -3.664568066596985e-05, -2.9928982257843018e-05, -2.3212283849716187e-05, -1.6495585441589355e-05, -9.778887033462524e-06, -3.0621886253356934e-06, 3.6545097827911377e-06, 1.0371208190917969e-05, 1.70879065990448e-05, 2.380460500717163e-05, 3.052130341529846e-05, 3.723800182342529e-05, 4.3954700231552124e-05, 5.0671398639678955e-05, 5.7388097047805786e-05, 6.410479545593262e-05, 7.082149386405945e-05, 7.753819227218628e-05, 8.425489068031311e-05, 9.097158908843994e-05, 9.768828749656677e-05, 0.0001044049859046936, 0.00011112168431282043, 0.00011783838272094727, 0.0001245550811290741, 0.00013127177953720093, 0.00013798847794532776, 0.0001447051763534546, 0.00015142187476158142, 0.00015813857316970825, 0.00016485527157783508, 0.00017157196998596191, 0.00017828866839408875, 0.00018500536680221558, 0.0001917220652103424, 0.00019843876361846924, 0.00020515546202659607, 0.0002118721604347229, 0.00021858885884284973, 0.00022530555725097656]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 6.0, 14.0, 20.0, 39.0, 90.0, 102.0, 154.0, 179.0, 155.0, 114.0, 61.0, 29.0, 24.0, 9.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.876788342604414e-06, -8.102773790596984e-06, -7.328759238589555e-06, -6.554745141329477e-06, -5.780730589322047e-06, -5.006716037314618e-06, -4.23270194005454e-06, -3.4586873880471103e-06, -2.684672836039681e-06, -1.9106582840322517e-06, -1.1366439593984978e-06, -3.6262963476474397e-07, 4.1138491724268533e-07, 1.1853994692501146e-06, 1.959413566510193e-06, 2.7334281185176224e-06, 3.5074426705250517e-06, 4.281457222532481e-06, 5.05547177453991e-06, 5.829485871799989e-06, 6.603500423807418e-06, 7.377514975814847e-06, 8.151529073074926e-06, 8.925543625082355e-06, 9.699558177089784e-06, 1.0473572729097214e-05, 1.1247587281104643e-05, 1.202160092361737e-05, 1.27956154756248e-05, 1.3569630027632229e-05, 1.4343644579639658e-05, 1.5117659131647088e-05, 1.5891673683654517e-05, 1.6665688235661946e-05, 1.7439702787669376e-05, 1.8213717339676805e-05, 1.8987731891684234e-05, 1.9761746443691663e-05, 2.0535760995699093e-05, 2.130977372871712e-05, 2.208379009971395e-05, 2.285780465172138e-05, 2.363181920372881e-05, 2.440583375573624e-05, 2.517984830774367e-05, 2.5953862859751098e-05, 2.6727877411758527e-05, 2.7501890144776553e-05, 2.8275904696783982e-05, 2.904991924879141e-05, 2.982393380079884e-05, 3.059794835280627e-05, 3.1371961085824296e-05, 3.214597745682113e-05, 3.2919990189839154e-05, 3.369400656083599e-05, 3.446801929385401e-05, 3.524203202687204e-05, 3.601604839786887e-05, 3.67900611308869e-05, 3.756407750188373e-05, 3.8338090234901756e-05, 3.911210660589859e-05, 3.9886119338916615e-05, 4.066013570991345e-05]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 4.0, 12.0, 10.0, 12.0, 18.0, 17.0, 14.0, 20.0, 23.0, 25.0, 26.0, 40.0, 31.0, 32.0, 43.0, 26.0, 47.0, 51.0, 26.0, 46.0, 37.0, 38.0, 56.0, 26.0, 36.0, 36.0, 16.0, 36.0, 29.0, 19.0, 23.0, 19.0, 16.0, 9.0, 18.0, 8.0, 9.0, 6.0, 7.0, 5.0, 5.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-06, -4.610046744346619e-06, -4.451721906661987e-06, -4.293397068977356e-06, -4.135072231292725e-06, -3.976747393608093e-06, -3.818422555923462e-06, -3.6600977182388306e-06, -3.5017728805541992e-06, -3.343448042869568e-06, -3.1851232051849365e-06, -3.026798367500305e-06, -2.868473529815674e-06, -2.7101486921310425e-06, -2.551823854446411e-06, -2.3934990167617798e-06, -2.2351741790771484e-06, -2.076849341392517e-06, -1.9185245037078857e-06, -1.7601996660232544e-06, -1.601874828338623e-06, -1.4435499906539917e-06, -1.2852251529693604e-06, -1.126900315284729e-06, -9.685754776000977e-07, -8.102506399154663e-07, -6.51925802230835e-07, -4.936009645462036e-07, -3.3527612686157227e-07, -1.7695128917694092e-07, -1.862645149230957e-08, 1.3969838619232178e-07, 2.980232238769531e-07, 4.5634806156158447e-07, 6.146728992462158e-07, 7.729977369308472e-07, 9.313225746154785e-07, 1.0896474123001099e-06, 1.2479722499847412e-06, 1.4062970876693726e-06, 1.564621925354004e-06, 1.7229467630386353e-06, 1.8812716007232666e-06, 2.039596438407898e-06, 2.1979212760925293e-06, 2.3562461137771606e-06, 2.514570951461792e-06, 2.6728957891464233e-06, 2.8312206268310547e-06, 2.989545464515686e-06, 3.1478703022003174e-06, 3.3061951398849487e-06, 3.46451997756958e-06, 3.6228448152542114e-06, 3.7811696529388428e-06, 3.939494490623474e-06, 4.0978193283081055e-06, 4.256144165992737e-06, 4.414469003677368e-06, 4.5727938413619995e-06, 4.731118679046631e-06, 4.889443516731262e-06, 5.0477683544158936e-06, 5.206093192100525e-06, 5.364418029785156e-06]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 6.0, 9.0, 8.0, 18.0, 20.0, 11.0, 15.0, 19.0, 32.0, 24.0, 30.0, 36.0, 55.0, 35.0, 40.0, 37.0, 43.0, 40.0, 39.0, 45.0, 34.0, 46.0, 36.0, 39.0, 26.0, 38.0, 34.0, 24.0, 27.0, 17.0, 21.0, 16.0, 14.0, 6.0, 8.0, 5.0, 10.0, 10.0, 3.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01171875, -3.891265869140625, -3.77081298828125, -3.650360107421875, -3.5299072265625, -3.409454345703125, -3.28900146484375, -3.168548583984375, -3.048095703125, -2.927642822265625, -2.80718994140625, -2.686737060546875, -2.5662841796875, -2.445831298828125, -2.32537841796875, -2.204925537109375, -2.08447265625, -1.964019775390625, -1.84356689453125, -1.723114013671875, -1.6026611328125, -1.482208251953125, -1.36175537109375, -1.241302490234375, -1.120849609375, -1.000396728515625, -0.87994384765625, -0.759490966796875, -0.6390380859375, -0.518585205078125, -0.39813232421875, -0.277679443359375, -0.1572265625, -0.036773681640625, 0.08367919921875, 0.204132080078125, 0.3245849609375, 0.445037841796875, 0.56549072265625, 0.685943603515625, 0.806396484375, 0.926849365234375, 1.04730224609375, 1.167755126953125, 1.2882080078125, 1.408660888671875, 1.52911376953125, 1.649566650390625, 1.77001953125, 1.890472412109375, 2.01092529296875, 2.131378173828125, 2.2518310546875, 2.372283935546875, 2.49273681640625, 2.613189697265625, 2.733642578125, 2.854095458984375, 2.97454833984375, 3.095001220703125, 3.2154541015625, 3.335906982421875, 3.45635986328125, 3.576812744140625, 3.697265625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 4.0, 14.0, 10.0, 30.0, 54.0, 53.0, 108.0, 158.0, 264.0, 431.0, 742.0, 1291.0, 2357.0, 4703.0, 10378.0, 24542.0, 69131.0, 261063.0, 481842.0, 122729.0, 39254.0, 15403.0, 6713.0, 3260.0, 1631.0, 949.0, 545.0, 339.0, 175.0, 126.0, 72.0, 47.0, 31.0, 24.0, 13.0, 16.0, 9.0, 9.0, 6.0, 2.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.56640625, -5.39892578125, -5.2314453125, -5.06396484375, -4.896484375, -4.72900390625, -4.5615234375, -4.39404296875, -4.2265625, -4.05908203125, -3.8916015625, -3.72412109375, -3.556640625, -3.38916015625, -3.2216796875, -3.05419921875, -2.88671875, -2.71923828125, -2.5517578125, -2.38427734375, -2.216796875, -2.04931640625, -1.8818359375, -1.71435546875, -1.546875, -1.37939453125, -1.2119140625, -1.04443359375, -0.876953125, -0.70947265625, -0.5419921875, -0.37451171875, -0.20703125, -0.03955078125, 0.1279296875, 0.29541015625, 0.462890625, 0.63037109375, 0.7978515625, 0.96533203125, 1.1328125, 1.30029296875, 1.4677734375, 1.63525390625, 1.802734375, 1.97021484375, 2.1376953125, 2.30517578125, 2.47265625, 2.64013671875, 2.8076171875, 2.97509765625, 3.142578125, 3.31005859375, 3.4775390625, 3.64501953125, 3.8125, 3.97998046875, 4.1474609375, 4.31494140625, 4.482421875, 4.64990234375, 4.8173828125, 4.98486328125, 5.15234375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 8.0, 11.0, 13.0, 9.0, 13.0, 18.0, 21.0, 15.0, 33.0, 35.0, 41.0, 45.0, 46.0, 61.0, 78.0, 203.0, 1774.0, 166.0, 80.0, 51.0, 38.0, 49.0, 32.0, 32.0, 29.0, 32.0, 20.0, 22.0, 19.0, 8.0, 9.0, 10.0, 7.0, 2.0, 8.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.6875, -15.23193359375, -14.7763671875, -14.32080078125, -13.865234375, -13.40966796875, -12.9541015625, -12.49853515625, -12.04296875, -11.58740234375, -11.1318359375, -10.67626953125, -10.220703125, -9.76513671875, -9.3095703125, -8.85400390625, -8.3984375, -7.94287109375, -7.4873046875, -7.03173828125, -6.576171875, -6.12060546875, -5.6650390625, -5.20947265625, -4.75390625, -4.29833984375, -3.8427734375, -3.38720703125, -2.931640625, -2.47607421875, -2.0205078125, -1.56494140625, -1.109375, -0.65380859375, -0.1982421875, 0.25732421875, 0.712890625, 1.16845703125, 1.6240234375, 2.07958984375, 2.53515625, 2.99072265625, 3.4462890625, 3.90185546875, 4.357421875, 4.81298828125, 5.2685546875, 5.72412109375, 6.1796875, 6.63525390625, 7.0908203125, 7.54638671875, 8.001953125, 8.45751953125, 8.9130859375, 9.36865234375, 9.82421875, 10.27978515625, 10.7353515625, 11.19091796875, 11.646484375, 12.10205078125, 12.5576171875, 13.01318359375, 13.46875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 6.0, 3.0, 9.0, 10.0, 8.0, 15.0, 19.0, 20.0, 28.0, 25.0, 45.0, 56.0, 72.0, 100.0, 217.0, 403.0, 2398.0, 130899.0, 2997792.0, 11959.0, 873.0, 233.0, 145.0, 98.0, 64.0, 55.0, 31.0, 13.0, 25.0, 16.0, 11.0, 6.0, 20.0, 12.0, 7.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.546875, -27.571044921875, -26.59521484375, -25.619384765625, -24.6435546875, -23.667724609375, -22.69189453125, -21.716064453125, -20.740234375, -19.764404296875, -18.78857421875, -17.812744140625, -16.8369140625, -15.861083984375, -14.88525390625, -13.909423828125, -12.93359375, -11.957763671875, -10.98193359375, -10.006103515625, -9.0302734375, -8.054443359375, -7.07861328125, -6.102783203125, -5.126953125, -4.151123046875, -3.17529296875, -2.199462890625, -1.2236328125, -0.247802734375, 0.72802734375, 1.703857421875, 2.6796875, 3.655517578125, 4.63134765625, 5.607177734375, 6.5830078125, 7.558837890625, 8.53466796875, 9.510498046875, 10.486328125, 11.462158203125, 12.43798828125, 13.413818359375, 14.3896484375, 15.365478515625, 16.34130859375, 17.317138671875, 18.29296875, 19.268798828125, 20.24462890625, 21.220458984375, 22.1962890625, 23.172119140625, 24.14794921875, 25.123779296875, 26.099609375, 27.075439453125, 28.05126953125, 29.027099609375, 30.0029296875, 30.978759765625, 31.95458984375, 32.930419921875, 33.90625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 24.0, 157.0, 452.0, 316.0, 57.0, 9.0], "bins": [-119.11033630371094, -117.14849090576172, -115.18665313720703, -113.22480773925781, -111.26296997070312, -109.3011245727539, -107.33928680419922, -105.37744140625, -103.41560363769531, -101.4537582397461, -99.4919204711914, -97.53007507324219, -95.5682373046875, -93.60639190673828, -91.6445541381836, -89.68270874023438, -87.72086334228516, -85.75901794433594, -83.79718017578125, -81.83533477783203, -79.87349700927734, -77.91165161132812, -75.94981384277344, -73.98796844482422, -72.02613067626953, -70.06428527832031, -68.10244750976562, -66.1406021118164, -64.17876434326172, -62.2169189453125, -60.25508117675781, -58.293235778808594, -56.33139419555664, -54.36955261230469, -52.407711029052734, -50.44586944580078, -48.48402786254883, -46.522186279296875, -44.560340881347656, -42.5984992980957, -40.63665771484375, -38.6748161315918, -36.712974548339844, -34.75113296508789, -32.78929138183594, -30.82744789123535, -28.8656063079834, -26.903762817382812, -24.94192123413086, -22.980079650878906, -21.018238067626953, -19.056396484375, -17.094552993774414, -15.132711410522461, -13.170869827270508, -11.209027290344238, -9.247186660766602, -7.28534460067749, -5.323502540588379, -3.361660957336426, -1.3998188972473145, 0.5620231628417969, 2.52386474609375, 4.4857072830200195, 6.447549343109131]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 8.0, 6.0, 9.0, 7.0, 16.0, 10.0, 29.0, 18.0, 28.0, 27.0, 30.0, 28.0, 29.0, 37.0, 45.0, 36.0, 42.0, 45.0, 48.0, 38.0, 44.0, 39.0, 43.0, 33.0, 33.0, 21.0, 30.0, 25.0, 22.0, 21.0, 20.0, 15.0, 28.0, 19.0, 18.0, 11.0, 10.0, 7.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-37.77830123901367, -36.658756256103516, -35.53921127319336, -34.4196662902832, -33.30012130737305, -32.18057632446289, -31.061031341552734, -29.941486358642578, -28.821941375732422, -27.702396392822266, -26.58285140991211, -25.463306427001953, -24.343761444091797, -23.22421646118164, -22.104671478271484, -20.985126495361328, -19.86557960510254, -18.746034622192383, -17.626489639282227, -16.50694465637207, -15.387399673461914, -14.267854690551758, -13.148308753967285, -12.028763771057129, -10.909218788146973, -9.789673805236816, -8.67012882232666, -7.550583362579346, -6.4310383796691895, -5.311493396759033, -4.191947937011719, -3.0724029541015625, -1.9528579711914062, -0.8333128690719604, 0.28623223304748535, 1.4057774543762207, 2.525322437286377, 3.644867420196533, 4.764412879943848, 5.883957862854004, 7.00350284576416, 8.123047828674316, 9.242592811584473, 10.362138748168945, 11.481683731079102, 12.601228713989258, 13.720773696899414, 14.84031867980957, 15.959863662719727, 17.079408645629883, 18.19895362854004, 19.318498611450195, 20.43804359436035, 21.557588577270508, 22.677135467529297, 23.796680450439453, 24.91622543334961, 26.035770416259766, 27.155315399169922, 28.274860382080078, 29.394405364990234, 30.51395034790039, 31.633495330810547, 32.7530403137207, 33.87258529663086]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 9.0, 2.0, 12.0, 5.0, 6.0, 14.0, 16.0, 15.0, 16.0, 26.0, 26.0, 26.0, 36.0, 31.0, 44.0, 41.0, 33.0, 39.0, 40.0, 46.0, 45.0, 35.0, 48.0, 37.0, 37.0, 28.0, 40.0, 38.0, 36.0, 25.0, 19.0, 20.0, 16.0, 18.0, 8.0, 14.0, 9.0, 11.0, 8.0, 2.0, 5.0, 9.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.38671875, -4.262908935546875, -4.13909912109375, -4.015289306640625, -3.8914794921875, -3.767669677734375, -3.64385986328125, -3.520050048828125, -3.396240234375, -3.272430419921875, -3.14862060546875, -3.024810791015625, -2.9010009765625, -2.777191162109375, -2.65338134765625, -2.529571533203125, -2.40576171875, -2.281951904296875, -2.15814208984375, -2.034332275390625, -1.9105224609375, -1.786712646484375, -1.66290283203125, -1.539093017578125, -1.415283203125, -1.291473388671875, -1.16766357421875, -1.043853759765625, -0.9200439453125, -0.796234130859375, -0.67242431640625, -0.548614501953125, -0.4248046875, -0.300994873046875, -0.17718505859375, -0.053375244140625, 0.0704345703125, 0.194244384765625, 0.31805419921875, 0.441864013671875, 0.565673828125, 0.689483642578125, 0.81329345703125, 0.937103271484375, 1.0609130859375, 1.184722900390625, 1.30853271484375, 1.432342529296875, 1.55615234375, 1.679962158203125, 1.80377197265625, 1.927581787109375, 2.0513916015625, 2.175201416015625, 2.29901123046875, 2.422821044921875, 2.546630859375, 2.670440673828125, 2.79425048828125, 2.918060302734375, 3.0418701171875, 3.165679931640625, 3.28948974609375, 3.413299560546875, 3.537109375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 6.0, 11.0, 7.0, 15.0, 21.0, 39.0, 50.0, 65.0, 103.0, 121.0, 196.0, 278.0, 470.0, 630.0, 976.0, 1474.0, 2470.0, 3992.0, 6588.0, 11591.0, 21178.0, 41321.0, 88514.0, 210004.0, 544618.0, 1271664.0, 1162611.0, 476143.0, 185737.0, 79612.0, 37672.0, 19384.0, 10899.0, 6122.0, 3590.0, 2214.0, 1316.0, 880.0, 537.0, 395.0, 248.0, 164.0, 128.0, 79.0, 50.0, 40.0, 16.0, 23.0, 12.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.912109375, -3.781402587890625, -3.65069580078125, -3.519989013671875, -3.3892822265625, -3.258575439453125, -3.12786865234375, -2.997161865234375, -2.866455078125, -2.735748291015625, -2.60504150390625, -2.474334716796875, -2.3436279296875, -2.212921142578125, -2.08221435546875, -1.951507568359375, -1.82080078125, -1.690093994140625, -1.55938720703125, -1.428680419921875, -1.2979736328125, -1.167266845703125, -1.03656005859375, -0.905853271484375, -0.775146484375, -0.644439697265625, -0.51373291015625, -0.383026123046875, -0.2523193359375, -0.121612548828125, 0.00909423828125, 0.139801025390625, 0.2705078125, 0.401214599609375, 0.53192138671875, 0.662628173828125, 0.7933349609375, 0.924041748046875, 1.05474853515625, 1.185455322265625, 1.316162109375, 1.446868896484375, 1.57757568359375, 1.708282470703125, 1.8389892578125, 1.969696044921875, 2.10040283203125, 2.231109619140625, 2.36181640625, 2.492523193359375, 2.62322998046875, 2.753936767578125, 2.8846435546875, 3.015350341796875, 3.14605712890625, 3.276763916015625, 3.407470703125, 3.538177490234375, 3.66888427734375, 3.799591064453125, 3.9302978515625, 4.061004638671875, 4.19171142578125, 4.322418212890625, 4.453125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 6.0, 11.0, 20.0, 27.0, 35.0, 50.0, 61.0, 63.0, 101.0, 100.0, 160.0, 206.0, 303.0, 325.0, 472.0, 506.0, 369.0, 323.0, 219.0, 164.0, 125.0, 103.0, 68.0, 47.0, 45.0, 42.0, 28.0, 18.0, 19.0, 12.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.60546875, -5.40606689453125, -5.2066650390625, -5.00726318359375, -4.807861328125, -4.60845947265625, -4.4090576171875, -4.20965576171875, -4.01025390625, -3.81085205078125, -3.6114501953125, -3.41204833984375, -3.212646484375, -3.01324462890625, -2.8138427734375, -2.61444091796875, -2.4150390625, -2.21563720703125, -2.0162353515625, -1.81683349609375, -1.617431640625, -1.41802978515625, -1.2186279296875, -1.01922607421875, -0.81982421875, -0.62042236328125, -0.4210205078125, -0.22161865234375, -0.022216796875, 0.17718505859375, 0.3765869140625, 0.57598876953125, 0.775390625, 0.97479248046875, 1.1741943359375, 1.37359619140625, 1.572998046875, 1.77239990234375, 1.9718017578125, 2.17120361328125, 2.37060546875, 2.57000732421875, 2.7694091796875, 2.96881103515625, 3.168212890625, 3.36761474609375, 3.5670166015625, 3.76641845703125, 3.9658203125, 4.16522216796875, 4.3646240234375, 4.56402587890625, 4.763427734375, 4.96282958984375, 5.1622314453125, 5.36163330078125, 5.56103515625, 5.76043701171875, 5.9598388671875, 6.15924072265625, 6.358642578125, 6.55804443359375, 6.7574462890625, 6.95684814453125, 7.15625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 5.0, 1.0, 4.0, 12.0, 24.0, 18.0, 49.0, 51.0, 77.0, 83.0, 149.0, 257.0, 367.0, 1101.0, 6490.0, 153276.0, 3752204.0, 268355.0, 9257.0, 1302.0, 437.0, 242.0, 166.0, 115.0, 81.0, 54.0, 36.0, 25.0, 20.0, 8.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.859375, -25.980712890625, -25.10205078125, -24.223388671875, -23.3447265625, -22.466064453125, -21.58740234375, -20.708740234375, -19.830078125, -18.951416015625, -18.07275390625, -17.194091796875, -16.3154296875, -15.436767578125, -14.55810546875, -13.679443359375, -12.80078125, -11.922119140625, -11.04345703125, -10.164794921875, -9.2861328125, -8.407470703125, -7.52880859375, -6.650146484375, -5.771484375, -4.892822265625, -4.01416015625, -3.135498046875, -2.2568359375, -1.378173828125, -0.49951171875, 0.379150390625, 1.2578125, 2.136474609375, 3.01513671875, 3.893798828125, 4.7724609375, 5.651123046875, 6.52978515625, 7.408447265625, 8.287109375, 9.165771484375, 10.04443359375, 10.923095703125, 11.8017578125, 12.680419921875, 13.55908203125, 14.437744140625, 15.31640625, 16.195068359375, 17.07373046875, 17.952392578125, 18.8310546875, 19.709716796875, 20.58837890625, 21.467041015625, 22.345703125, 23.224365234375, 24.10302734375, 24.981689453125, 25.8603515625, 26.739013671875, 27.61767578125, 28.496337890625, 29.375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 17.0, 52.0, 116.0, 181.0, 204.0, 192.0, 132.0, 61.0, 29.0, 12.0, 6.0, 7.0, 1.0, 0.0, 1.0, 1.0], "bins": [-112.98712158203125, -110.84354400634766, -108.69995880126953, -106.55638122558594, -104.41280364990234, -102.26922607421875, -100.12564086914062, -97.98206329345703, -95.83848571777344, -93.69490814208984, -91.55132293701172, -89.40774536132812, -87.26416778564453, -85.12059020996094, -82.97700500488281, -80.83342742919922, -78.6898422241211, -76.5462646484375, -74.40267944335938, -72.25910186767578, -70.11552429199219, -67.97193908691406, -65.82836151123047, -63.684783935546875, -61.541202545166016, -59.397621154785156, -57.25404357910156, -55.1104621887207, -52.966880798339844, -50.82330322265625, -48.67972183227539, -46.53614044189453, -44.39256286621094, -42.24898147583008, -40.105403900146484, -37.961822509765625, -35.81824493408203, -33.67466354370117, -31.531082153320312, -29.387502670288086, -27.243925094604492, -25.100345611572266, -22.956764221191406, -20.81318473815918, -18.669605255126953, -16.526025772094727, -14.382445335388184, -12.23886489868164, -10.095285415649414, -7.951705455780029, -5.8081254959106445, -3.6645455360412598, -1.520965576171875, 0.6226139068603516, 2.7661943435668945, 4.9097747802734375, 7.053354263305664, 9.19693374633789, 11.340514183044434, 13.484094619750977, 15.627674102783203, 17.77125358581543, 19.914833068847656, 22.058414459228516, 24.201993942260742]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 3.0, 7.0, 5.0, 11.0, 10.0, 8.0, 8.0, 16.0, 20.0, 13.0, 19.0, 22.0, 30.0, 22.0, 30.0, 33.0, 31.0, 35.0, 41.0, 35.0, 39.0, 58.0, 33.0, 36.0, 37.0, 29.0, 29.0, 28.0, 32.0, 26.0, 20.0, 37.0, 30.0, 22.0, 23.0, 16.0, 15.0, 19.0, 9.0, 16.0, 11.0, 7.0, 9.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-23.672319412231445, -22.988147735595703, -22.30397605895996, -21.61980438232422, -20.935632705688477, -20.251461029052734, -19.567289352416992, -18.88311767578125, -18.198945999145508, -17.514774322509766, -16.830602645874023, -16.14643096923828, -15.462259292602539, -14.778087615966797, -14.093915939331055, -13.409744262695312, -12.72557258605957, -12.041400909423828, -11.357229232788086, -10.673057556152344, -9.988885879516602, -9.30471420288086, -8.620542526245117, -7.936370849609375, -7.252199172973633, -6.568027496337891, -5.883855819702148, -5.199684143066406, -4.515512466430664, -3.831340789794922, -3.1471691131591797, -2.4629974365234375, -1.7788257598876953, -1.0946540832519531, -0.41048240661621094, 0.27368927001953125, 0.9578609466552734, 1.6420326232910156, 2.326204299926758, 3.0103759765625, 3.694547653198242, 4.378719329833984, 5.062891006469727, 5.747062683105469, 6.431234359741211, 7.115406036376953, 7.799577713012695, 8.483749389648438, 9.16792106628418, 9.852092742919922, 10.536264419555664, 11.220436096191406, 11.904607772827148, 12.58877944946289, 13.272951126098633, 13.957122802734375, 14.641294479370117, 15.32546615600586, 16.0096378326416, 16.693809509277344, 17.377981185913086, 18.062152862548828, 18.74632453918457, 19.430496215820312, 20.114667892456055]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 9.0, 8.0, 6.0, 9.0, 15.0, 16.0, 16.0, 27.0, 26.0, 27.0, 35.0, 37.0, 35.0, 37.0, 46.0, 52.0, 44.0, 43.0, 27.0, 38.0, 35.0, 43.0, 45.0, 37.0, 31.0, 28.0, 33.0, 22.0, 27.0, 27.0, 16.0, 17.0, 14.0, 10.0, 10.0, 3.0, 14.0, 6.0, 9.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-4.2890625, -4.16082763671875, -4.0325927734375, -3.90435791015625, -3.776123046875, -3.64788818359375, -3.5196533203125, -3.39141845703125, -3.26318359375, -3.13494873046875, -3.0067138671875, -2.87847900390625, -2.750244140625, -2.62200927734375, -2.4937744140625, -2.36553955078125, -2.2373046875, -2.10906982421875, -1.9808349609375, -1.85260009765625, -1.724365234375, -1.59613037109375, -1.4678955078125, -1.33966064453125, -1.21142578125, -1.08319091796875, -0.9549560546875, -0.82672119140625, -0.698486328125, -0.57025146484375, -0.4420166015625, -0.31378173828125, -0.185546875, -0.05731201171875, 0.0709228515625, 0.19915771484375, 0.327392578125, 0.45562744140625, 0.5838623046875, 0.71209716796875, 0.84033203125, 0.96856689453125, 1.0968017578125, 1.22503662109375, 1.353271484375, 1.48150634765625, 1.6097412109375, 1.73797607421875, 1.8662109375, 1.99444580078125, 2.1226806640625, 2.25091552734375, 2.379150390625, 2.50738525390625, 2.6356201171875, 2.76385498046875, 2.89208984375, 3.02032470703125, 3.1485595703125, 3.27679443359375, 3.405029296875, 3.53326416015625, 3.6614990234375, 3.78973388671875, 3.91796875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 7.0, 10.0, 5.0, 13.0, 21.0, 25.0, 42.0, 56.0, 90.0, 143.0, 205.0, 260.0, 368.0, 559.0, 764.0, 1180.0, 1575.0, 2380.0, 3445.0, 5164.0, 7827.0, 11808.0, 18608.0, 29654.0, 49490.0, 86051.0, 170802.0, 313009.0, 146252.0, 76792.0, 44720.0, 26954.0, 17144.0, 10991.0, 7168.0, 4824.0, 3207.0, 2126.0, 1446.0, 1051.0, 730.0, 496.0, 350.0, 249.0, 148.0, 110.0, 80.0, 60.0, 35.0, 33.0, 11.0, 15.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.292236328125, -0.282623291015625, -0.27301025390625, -0.263397216796875, -0.2537841796875, -0.244171142578125, -0.23455810546875, -0.224945068359375, -0.21533203125, -0.205718994140625, -0.19610595703125, -0.186492919921875, -0.1768798828125, -0.167266845703125, -0.15765380859375, -0.148040771484375, -0.138427734375, -0.128814697265625, -0.11920166015625, -0.109588623046875, -0.0999755859375, -0.090362548828125, -0.08074951171875, -0.071136474609375, -0.0615234375, -0.051910400390625, -0.04229736328125, -0.032684326171875, -0.0230712890625, -0.013458251953125, -0.00384521484375, 0.005767822265625, 0.015380859375, 0.024993896484375, 0.03460693359375, 0.044219970703125, 0.0538330078125, 0.063446044921875, 0.07305908203125, 0.082672119140625, 0.09228515625, 0.101898193359375, 0.11151123046875, 0.121124267578125, 0.1307373046875, 0.140350341796875, 0.14996337890625, 0.159576416015625, 0.169189453125, 0.178802490234375, 0.18841552734375, 0.198028564453125, 0.2076416015625, 0.217254638671875, 0.22686767578125, 0.236480712890625, 0.24609375, 0.255706787109375, 0.26531982421875, 0.274932861328125, 0.2845458984375, 0.294158935546875, 0.30377197265625, 0.313385009765625, 0.322998046875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 9.0, 12.0, 13.0, 17.0, 14.0, 17.0, 22.0, 26.0, 35.0, 32.0, 33.0, 34.0, 37.0, 44.0, 40.0, 44.0, 45.0, 1064.0, 57.0, 43.0, 39.0, 43.0, 33.0, 27.0, 41.0, 30.0, 25.0, 28.0, 16.0, 17.0, 17.0, 16.0, 13.0, 13.0, 6.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1875, -3.092132568359375, -2.99676513671875, -2.901397705078125, -2.8060302734375, -2.710662841796875, -2.61529541015625, -2.519927978515625, -2.424560546875, -2.329193115234375, -2.23382568359375, -2.138458251953125, -2.0430908203125, -1.947723388671875, -1.85235595703125, -1.756988525390625, -1.66162109375, -1.566253662109375, -1.47088623046875, -1.375518798828125, -1.2801513671875, -1.184783935546875, -1.08941650390625, -0.994049072265625, -0.898681640625, -0.803314208984375, -0.70794677734375, -0.612579345703125, -0.5172119140625, -0.421844482421875, -0.32647705078125, -0.231109619140625, -0.1357421875, -0.040374755859375, 0.05499267578125, 0.150360107421875, 0.2457275390625, 0.341094970703125, 0.43646240234375, 0.531829833984375, 0.627197265625, 0.722564697265625, 0.81793212890625, 0.913299560546875, 1.0086669921875, 1.104034423828125, 1.19940185546875, 1.294769287109375, 1.39013671875, 1.485504150390625, 1.58087158203125, 1.676239013671875, 1.7716064453125, 1.866973876953125, 1.96234130859375, 2.057708740234375, 2.153076171875, 2.248443603515625, 2.34381103515625, 2.439178466796875, 2.5345458984375, 2.629913330078125, 2.72528076171875, 2.820648193359375, 2.916015625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 22.0, 17.0, 23.0, 39.0, 66.0, 79.0, 149.0, 202.0, 317.0, 483.0, 695.0, 1169.0, 1837.0, 2905.0, 4655.0, 7533.0, 12586.0, 21289.0, 37396.0, 69750.0, 148805.0, 1450367.0, 164631.0, 74941.0, 39917.0, 22702.0, 13276.0, 7933.0, 4858.0, 3088.0, 1908.0, 1189.0, 804.0, 500.0, 334.0, 199.0, 147.0, 104.0, 74.0, 40.0, 28.0, 25.0, 9.0, 9.0, 5.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.194580078125, -0.18821144104003906, -0.18184280395507812, -0.1754741668701172, -0.16910552978515625, -0.1627368927001953, -0.15636825561523438, -0.14999961853027344, -0.1436309814453125, -0.13726234436035156, -0.13089370727539062, -0.12452507019042969, -0.11815643310546875, -0.11178779602050781, -0.10541915893554688, -0.09905052185058594, -0.092681884765625, -0.08631324768066406, -0.07994461059570312, -0.07357597351074219, -0.06720733642578125, -0.06083869934082031, -0.054470062255859375, -0.04810142517089844, -0.0417327880859375, -0.03536415100097656, -0.028995513916015625, -0.022626876831054688, -0.01625823974609375, -0.009889602661132812, -0.003520965576171875, 0.0028476715087890625, 0.00921630859375, 0.015584945678710938, 0.021953582763671875, 0.028322219848632812, 0.03469085693359375, 0.04105949401855469, 0.047428131103515625, 0.05379676818847656, 0.0601654052734375, 0.06653404235839844, 0.07290267944335938, 0.07927131652832031, 0.08563995361328125, 0.09200859069824219, 0.09837722778320312, 0.10474586486816406, 0.111114501953125, 0.11748313903808594, 0.12385177612304688, 0.1302204132080078, 0.13658905029296875, 0.1429576873779297, 0.14932632446289062, 0.15569496154785156, 0.1620635986328125, 0.16843223571777344, 0.17480087280273438, 0.1811695098876953, 0.18753814697265625, 0.1939067840576172, 0.20027542114257812, 0.20664405822753906, 0.2130126953125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 7.0, 0.0, 0.0, 8.0, 4.0, 7.0, 14.0, 6.0, 11.0, 16.0, 25.0, 19.0, 23.0, 37.0, 45.0, 54.0, 63.0, 76.0, 67.0, 89.0, 86.0, 65.0, 55.0, 42.0, 24.0, 27.0, 21.0, 15.0, 10.0, 16.0, 10.0, 13.0, 7.0, 3.0, 3.0, 8.0, 4.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0], "bins": [-3.081560134887695e-05, -2.9955990612506866e-05, -2.909637987613678e-05, -2.8236769139766693e-05, -2.7377158403396606e-05, -2.651754766702652e-05, -2.5657936930656433e-05, -2.4798326194286346e-05, -2.393871545791626e-05, -2.3079104721546173e-05, -2.2219493985176086e-05, -2.1359883248806e-05, -2.0500272512435913e-05, -1.9640661776065826e-05, -1.878105103969574e-05, -1.7921440303325653e-05, -1.7061829566955566e-05, -1.620221883058548e-05, -1.5342608094215393e-05, -1.4482997357845306e-05, -1.362338662147522e-05, -1.2763775885105133e-05, -1.1904165148735046e-05, -1.104455441236496e-05, -1.0184943675994873e-05, -9.325332939624786e-06, -8.4657222032547e-06, -7.606111466884613e-06, -6.746500730514526e-06, -5.88688999414444e-06, -5.027279257774353e-06, -4.167668521404266e-06, -3.3080577850341797e-06, -2.448447048664093e-06, -1.5888363122940063e-06, -7.292255759239197e-07, 1.30385160446167e-07, 9.899958968162537e-07, 1.8496066331863403e-06, 2.709217369556427e-06, 3.5688281059265137e-06, 4.4284388422966e-06, 5.288049578666687e-06, 6.147660315036774e-06, 7.00727105140686e-06, 7.866881787776947e-06, 8.726492524147034e-06, 9.58610326051712e-06, 1.0445713996887207e-05, 1.1305324733257294e-05, 1.216493546962738e-05, 1.3024546205997467e-05, 1.3884156942367554e-05, 1.474376767873764e-05, 1.5603378415107727e-05, 1.6462989151477814e-05, 1.73225998878479e-05, 1.8182210624217987e-05, 1.9041821360588074e-05, 1.990143209695816e-05, 2.0761042833328247e-05, 2.1620653569698334e-05, 2.248026430606842e-05, 2.3339875042438507e-05, 2.4199485778808594e-05]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 7.0, 4.0, 16.0, 14.0, 11.0, 9.0, 32.0, 30.0, 42.0, 53.0, 93.0, 140.0, 352.0, 3628.0, 885580.0, 156629.0, 1241.0, 209.0, 120.0, 78.0, 54.0, 35.0, 27.0, 25.0, 21.0, 10.0, 6.0, 14.0, 12.0, 4.0, 7.0, 0.0, 0.0, 6.0, 3.0, 3.0, 0.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.0005407333374023438, -0.0005219951272010803, -0.0005032569169998169, -0.00048451870679855347, -0.00046578049659729004, -0.0004470422863960266, -0.0004283040761947632, -0.00040956586599349976, -0.00039082765579223633, -0.0003720894455909729, -0.00035335123538970947, -0.00033461302518844604, -0.0003158748149871826, -0.0002971366047859192, -0.00027839839458465576, -0.00025966018438339233, -0.0002409219741821289, -0.00022218376398086548, -0.00020344555377960205, -0.00018470734357833862, -0.0001659691333770752, -0.00014723092317581177, -0.00012849271297454834, -0.00010975450277328491, -9.101629257202148e-05, -7.227808237075806e-05, -5.353987216949463e-05, -3.48016619682312e-05, -1.6063451766967773e-05, 2.6747584342956543e-06, 2.1412968635559082e-05, 4.015117883682251e-05, 5.888938903808594e-05, 7.762759923934937e-05, 9.636580944061279e-05, 0.00011510401964187622, 0.00013384222984313965, 0.00015258044004440308, 0.0001713186502456665, 0.00019005686044692993, 0.00020879507064819336, 0.0002275332808494568, 0.0002462714910507202, 0.00026500970125198364, 0.00028374791145324707, 0.0003024861216545105, 0.0003212243318557739, 0.00033996254205703735, 0.0003587007522583008, 0.0003774389624595642, 0.00039617717266082764, 0.00041491538286209106, 0.0004336535930633545, 0.0004523918032646179, 0.00047113001346588135, 0.0004898682236671448, 0.0005086064338684082, 0.0005273446440696716, 0.0005460828542709351, 0.0005648210644721985, 0.0005835592746734619, 0.0006022974848747253, 0.0006210356950759888, 0.0006397739052772522, 0.0006585121154785156]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 42.0, 441.0, 479.0, 48.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001952902675839141, -0.00019174168119207025, -0.0001881930948002264, -0.00018464450840838253, -0.00018109590746462345, -0.0001775473210727796, -0.00017399873468093574, -0.00017045014828909189, -0.00016690156189724803, -0.00016335297550540417, -0.00015980438911356032, -0.00015625580272171646, -0.0001527072163298726, -0.00014915861538611352, -0.00014561002899426967, -0.00014206144260242581, -0.00013851285621058196, -0.0001349642698187381, -0.00013141568342689425, -0.0001278670970350504, -0.0001243184960912913, -0.00012076991697540507, -0.0001172213233076036, -0.00011367273691575974, -0.00011012415052391589, -0.00010657556413207203, -0.00010302697774022818, -9.94783840724267e-05, -9.592979768058285e-05, -9.2381211288739e-05, -8.883261762093753e-05, -8.528403122909367e-05, -8.17354375612922e-05, -7.818685116944835e-05, -7.463825750164688e-05, -7.108967110980302e-05, -6.754108471795917e-05, -6.399249832611531e-05, -6.044390829629265e-05, -5.6895318266469985e-05, -5.334673187462613e-05, -4.9798145482782274e-05, -4.624955545295961e-05, -4.270096542313695e-05, -3.9152379031293094e-05, -3.560379263944924e-05, -3.2055202609626576e-05, -2.8506614398793317e-05, -2.495802618796006e-05, -2.14094379771268e-05, -1.786084976629354e-05, -1.4312261555460282e-05, -1.0763673344627023e-05, -7.215085133793764e-06, -3.666496922960505e-06, -1.1790871212724596e-07, 3.430679498706013e-06, 6.979267709539272e-06, 1.052785592037253e-05, 1.407644413120579e-05, 1.762503234203905e-05, 2.1173620552872308e-05, 2.4722208763705567e-05, 2.8270796974538825e-05, 3.1819385185372084e-05]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 11.0, 13.0, 8.0, 10.0, 5.0, 18.0, 8.0, 13.0, 18.0, 20.0, 20.0, 25.0, 29.0, 30.0, 25.0, 37.0, 34.0, 46.0, 52.0, 42.0, 47.0, 45.0, 33.0, 32.0, 40.0, 34.0, 30.0, 41.0, 29.0, 18.0, 30.0, 21.0, 23.0, 16.0, 11.0, 16.0, 12.0, 18.0, 8.0, 12.0, 4.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.3649463653564453e-05, -1.3226643204689026e-05, -1.2803822755813599e-05, -1.2381002306938171e-05, -1.1958181858062744e-05, -1.1535361409187317e-05, -1.111254096031189e-05, -1.0689720511436462e-05, -1.0266900062561035e-05, -9.844079613685608e-06, -9.42125916481018e-06, -8.998438715934753e-06, -8.575618267059326e-06, -8.152797818183899e-06, -7.729977369308472e-06, -7.3071569204330444e-06, -6.884336471557617e-06, -6.46151602268219e-06, -6.038695573806763e-06, -5.6158751249313354e-06, -5.193054676055908e-06, -4.770234227180481e-06, -4.347413778305054e-06, -3.9245933294296265e-06, -3.5017728805541992e-06, -3.078952431678772e-06, -2.6561319828033447e-06, -2.2333115339279175e-06, -1.8104910850524902e-06, -1.387670636177063e-06, -9.648501873016357e-07, -5.420297384262085e-07, -1.1920928955078125e-07, 3.03611159324646e-07, 7.264316082000732e-07, 1.1492520570755005e-06, 1.5720725059509277e-06, 1.994892954826355e-06, 2.4177134037017822e-06, 2.8405338525772095e-06, 3.2633543014526367e-06, 3.686174750328064e-06, 4.108995199203491e-06, 4.5318156480789185e-06, 4.954636096954346e-06, 5.377456545829773e-06, 5.8002769947052e-06, 6.2230974435806274e-06, 6.645917892456055e-06, 7.068738341331482e-06, 7.491558790206909e-06, 7.914379239082336e-06, 8.337199687957764e-06, 8.760020136833191e-06, 9.182840585708618e-06, 9.605661034584045e-06, 1.0028481483459473e-05, 1.04513019323349e-05, 1.0874122381210327e-05, 1.1296942830085754e-05, 1.1719763278961182e-05, 1.2142583727836609e-05, 1.2565404176712036e-05, 1.2988224625587463e-05, 1.341104507446289e-05]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 9.0, 8.0, 6.0, 9.0, 15.0, 16.0, 16.0, 27.0, 26.0, 27.0, 35.0, 37.0, 35.0, 37.0, 46.0, 52.0, 44.0, 43.0, 27.0, 38.0, 35.0, 43.0, 45.0, 37.0, 31.0, 28.0, 33.0, 22.0, 27.0, 27.0, 16.0, 17.0, 14.0, 10.0, 10.0, 3.0, 14.0, 6.0, 9.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-4.2890625, -4.16082763671875, -4.0325927734375, -3.90435791015625, -3.776123046875, -3.64788818359375, -3.5196533203125, -3.39141845703125, -3.26318359375, -3.13494873046875, -3.0067138671875, -2.87847900390625, -2.750244140625, -2.62200927734375, -2.4937744140625, -2.36553955078125, -2.2373046875, -2.10906982421875, -1.9808349609375, -1.85260009765625, -1.724365234375, -1.59613037109375, -1.4678955078125, -1.33966064453125, -1.21142578125, -1.08319091796875, -0.9549560546875, -0.82672119140625, -0.698486328125, -0.57025146484375, -0.4420166015625, -0.31378173828125, -0.185546875, -0.05731201171875, 0.0709228515625, 0.19915771484375, 0.327392578125, 0.45562744140625, 0.5838623046875, 0.71209716796875, 0.84033203125, 0.96856689453125, 1.0968017578125, 1.22503662109375, 1.353271484375, 1.48150634765625, 1.6097412109375, 1.73797607421875, 1.8662109375, 1.99444580078125, 2.1226806640625, 2.25091552734375, 2.379150390625, 2.50738525390625, 2.6356201171875, 2.76385498046875, 2.89208984375, 3.02032470703125, 3.1485595703125, 3.27679443359375, 3.405029296875, 3.53326416015625, 3.6614990234375, 3.78973388671875, 3.91796875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 8.0, 12.0, 18.0, 28.0, 36.0, 58.0, 91.0, 158.0, 252.0, 348.0, 587.0, 941.0, 1478.0, 2529.0, 4118.0, 6709.0, 11199.0, 18836.0, 31384.0, 53117.0, 91622.0, 172545.0, 271997.0, 164664.0, 88159.0, 51259.0, 30614.0, 18177.0, 10809.0, 6551.0, 3902.0, 2420.0, 1444.0, 924.0, 556.0, 377.0, 214.0, 140.0, 100.0, 62.0, 31.0, 25.0, 18.0, 9.0, 11.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.689453125, -3.57220458984375, -3.4549560546875, -3.33770751953125, -3.220458984375, -3.10321044921875, -2.9859619140625, -2.86871337890625, -2.75146484375, -2.63421630859375, -2.5169677734375, -2.39971923828125, -2.282470703125, -2.16522216796875, -2.0479736328125, -1.93072509765625, -1.8134765625, -1.69622802734375, -1.5789794921875, -1.46173095703125, -1.344482421875, -1.22723388671875, -1.1099853515625, -0.99273681640625, -0.87548828125, -0.75823974609375, -0.6409912109375, -0.52374267578125, -0.406494140625, -0.28924560546875, -0.1719970703125, -0.05474853515625, 0.0625, 0.17974853515625, 0.2969970703125, 0.41424560546875, 0.531494140625, 0.64874267578125, 0.7659912109375, 0.88323974609375, 1.00048828125, 1.11773681640625, 1.2349853515625, 1.35223388671875, 1.469482421875, 1.58673095703125, 1.7039794921875, 1.82122802734375, 1.9384765625, 2.05572509765625, 2.1729736328125, 2.29022216796875, 2.407470703125, 2.52471923828125, 2.6419677734375, 2.75921630859375, 2.87646484375, 2.99371337890625, 3.1109619140625, 3.22821044921875, 3.345458984375, 3.46270751953125, 3.5799560546875, 3.69720458984375, 3.814453125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 17.0, 15.0, 12.0, 20.0, 24.0, 16.0, 24.0, 40.0, 38.0, 33.0, 33.0, 43.0, 75.0, 109.0, 230.0, 1443.0, 248.0, 99.0, 88.0, 64.0, 48.0, 40.0, 52.0, 38.0, 35.0, 29.0, 21.0, 23.0, 9.0, 15.0, 11.0, 12.0, 9.0, 12.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5703125, -10.1387939453125, -9.707275390625, -9.2757568359375, -8.84423828125, -8.4127197265625, -7.981201171875, -7.5496826171875, -7.1181640625, -6.6866455078125, -6.255126953125, -5.8236083984375, -5.39208984375, -4.9605712890625, -4.529052734375, -4.0975341796875, -3.666015625, -3.2344970703125, -2.802978515625, -2.3714599609375, -1.93994140625, -1.5084228515625, -1.076904296875, -0.6453857421875, -0.2138671875, 0.2176513671875, 0.649169921875, 1.0806884765625, 1.51220703125, 1.9437255859375, 2.375244140625, 2.8067626953125, 3.23828125, 3.6697998046875, 4.101318359375, 4.5328369140625, 4.96435546875, 5.3958740234375, 5.827392578125, 6.2589111328125, 6.6904296875, 7.1219482421875, 7.553466796875, 7.9849853515625, 8.41650390625, 8.8480224609375, 9.279541015625, 9.7110595703125, 10.142578125, 10.5740966796875, 11.005615234375, 11.4371337890625, 11.86865234375, 12.3001708984375, 12.731689453125, 13.1632080078125, 13.5947265625, 14.0262451171875, 14.457763671875, 14.8892822265625, 15.32080078125, 15.7523193359375, 16.183837890625, 16.6153564453125, 17.046875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 14.0, 12.0, 16.0, 15.0, 28.0, 26.0, 39.0, 59.0, 73.0, 139.0, 215.0, 379.0, 681.0, 1371.0, 3544.0, 13219.0, 98575.0, 2461691.0, 518985.0, 35773.0, 6602.0, 2114.0, 945.0, 443.0, 282.0, 145.0, 99.0, 56.0, 52.0, 31.0, 30.0, 13.0, 17.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.390625, -21.8131103515625, -21.235595703125, -20.6580810546875, -20.08056640625, -19.5030517578125, -18.925537109375, -18.3480224609375, -17.7705078125, -17.1929931640625, -16.615478515625, -16.0379638671875, -15.46044921875, -14.8829345703125, -14.305419921875, -13.7279052734375, -13.150390625, -12.5728759765625, -11.995361328125, -11.4178466796875, -10.84033203125, -10.2628173828125, -9.685302734375, -9.1077880859375, -8.5302734375, -7.9527587890625, -7.375244140625, -6.7977294921875, -6.22021484375, -5.6427001953125, -5.065185546875, -4.4876708984375, -3.91015625, -3.3326416015625, -2.755126953125, -2.1776123046875, -1.60009765625, -1.0225830078125, -0.445068359375, 0.1324462890625, 0.7099609375, 1.2874755859375, 1.864990234375, 2.4425048828125, 3.02001953125, 3.5975341796875, 4.175048828125, 4.7525634765625, 5.330078125, 5.9075927734375, 6.485107421875, 7.0626220703125, 7.64013671875, 8.2176513671875, 8.795166015625, 9.3726806640625, 9.9501953125, 10.5277099609375, 11.105224609375, 11.6827392578125, 12.26025390625, 12.8377685546875, 13.415283203125, 13.9927978515625, 14.5703125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 10.0, 10.0, 18.0, 20.0, 26.0, 42.0, 69.0, 89.0, 112.0, 117.0, 108.0, 96.0, 80.0, 61.0, 45.0, 35.0, 22.0, 18.0, 11.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.25005531311035, -18.365293502807617, -17.480533599853516, -16.59577178955078, -15.711009979248047, -14.826248168945312, -13.941487312316895, -13.056726455688477, -12.171964645385742, -11.287202835083008, -10.40244197845459, -9.517681121826172, -8.632919311523438, -7.748157978057861, -6.863396644592285, -5.978635311126709, -5.093873977661133, -4.209112644195557, -3.3243513107299805, -2.4395899772644043, -1.5548286437988281, -0.670067310333252, 0.21469402313232422, 1.0994553565979004, 1.9842166900634766, 2.8689780235290527, 3.753739356994629, 4.638500690460205, 5.523262023925781, 6.408023357391357, 7.292784690856934, 8.177545547485352, 9.062309265136719, 9.947071075439453, 10.831831932067871, 11.716592788696289, 12.601354598999023, 13.486116409301758, 14.370877265930176, 15.255638122558594, 16.140399932861328, 17.025161743164062, 17.909923553466797, 18.7946834564209, 19.679445266723633, 20.564207077026367, 21.44896697998047, 22.333728790283203, 23.218490600585938, 24.103252410888672, 24.988014221191406, 25.872774124145508, 26.757535934448242, 27.642297744750977, 28.527057647705078, 29.411819458007812, 30.296581268310547, 31.18134307861328, 32.066104888916016, 32.95086669921875, 33.83562469482422, 34.72038650512695, 35.60514831542969, 36.48991012573242, 37.374671936035156]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 4.0, 4.0, 2.0, 6.0, 12.0, 8.0, 12.0, 13.0, 18.0, 16.0, 22.0, 23.0, 34.0, 29.0, 30.0, 44.0, 31.0, 38.0, 31.0, 39.0, 35.0, 44.0, 52.0, 40.0, 41.0, 32.0, 34.0, 22.0, 39.0, 38.0, 27.0, 19.0, 28.0, 22.0, 14.0, 17.0, 18.0, 6.0, 14.0, 10.0, 6.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.16799545288086, -32.11408233642578, -31.060169219970703, -30.006256103515625, -28.95234489440918, -27.8984317779541, -26.844518661499023, -25.790605545043945, -24.7366943359375, -23.682781219482422, -22.628868103027344, -21.574954986572266, -20.52104377746582, -19.467130661010742, -18.413217544555664, -17.359304428100586, -16.305391311645508, -15.25147819519043, -14.197566032409668, -13.14365291595459, -12.089740753173828, -11.03582763671875, -9.981914520263672, -8.928001403808594, -7.874089241027832, -6.820176601409912, -5.766263961791992, -4.712350845336914, -3.658438205718994, -2.604525566101074, -1.550612449645996, -0.49669981002807617, 0.5572128295898438, 1.6111255884170532, 2.6650383472442627, 3.7189512252807617, 4.772863864898682, 5.826776504516602, 6.88068962097168, 7.9346022605896, 8.98851490020752, 10.042428016662598, 11.09634017944336, 12.150253295898438, 13.204166412353516, 14.258078575134277, 15.311991691589355, 16.365903854370117, 17.419816970825195, 18.473730087280273, 19.52764320373535, 20.581554412841797, 21.635467529296875, 22.689380645751953, 23.74329376220703, 24.79720687866211, 25.851119995117188, 26.905033111572266, 27.958946228027344, 29.012859344482422, 30.066770553588867, 31.120683670043945, 32.174598693847656, 33.22850799560547, 34.28242111206055]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 8.0, 6.0, 3.0, 4.0, 15.0, 13.0, 13.0, 18.0, 27.0, 28.0, 19.0, 25.0, 40.0, 37.0, 44.0, 40.0, 44.0, 35.0, 36.0, 48.0, 37.0, 34.0, 40.0, 29.0, 33.0, 37.0, 29.0, 36.0, 30.0, 29.0, 27.0, 17.0, 23.0, 17.0, 11.0, 7.0, 12.0, 12.0, 5.0, 7.0, 1.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.2109375, -4.083648681640625, -3.95635986328125, -3.829071044921875, -3.7017822265625, -3.574493408203125, -3.44720458984375, -3.319915771484375, -3.192626953125, -3.065338134765625, -2.93804931640625, -2.810760498046875, -2.6834716796875, -2.556182861328125, -2.42889404296875, -2.301605224609375, -2.17431640625, -2.047027587890625, -1.91973876953125, -1.792449951171875, -1.6651611328125, -1.537872314453125, -1.41058349609375, -1.283294677734375, -1.156005859375, -1.028717041015625, -0.90142822265625, -0.774139404296875, -0.6468505859375, -0.519561767578125, -0.39227294921875, -0.264984130859375, -0.1376953125, -0.010406494140625, 0.11688232421875, 0.244171142578125, 0.3714599609375, 0.498748779296875, 0.62603759765625, 0.753326416015625, 0.880615234375, 1.007904052734375, 1.13519287109375, 1.262481689453125, 1.3897705078125, 1.517059326171875, 1.64434814453125, 1.771636962890625, 1.89892578125, 2.026214599609375, 2.15350341796875, 2.280792236328125, 2.4080810546875, 2.535369873046875, 2.66265869140625, 2.789947509765625, 2.917236328125, 3.044525146484375, 3.17181396484375, 3.299102783203125, 3.4263916015625, 3.553680419921875, 3.68096923828125, 3.808258056640625, 3.935546875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 6.0, 0.0, 12.0, 10.0, 4.0, 5.0, 11.0, 14.0, 9.0, 20.0, 18.0, 20.0, 33.0, 43.0, 59.0, 102.0, 202.0, 414.0, 878.0, 2053.0, 5759.0, 18657.0, 75916.0, 490792.0, 2820618.0, 653498.0, 93153.0, 21542.0, 6297.0, 2262.0, 895.0, 398.0, 189.0, 112.0, 57.0, 40.0, 36.0, 35.0, 18.0, 12.0, 11.0, 16.0, 7.0, 11.0, 5.0, 5.0, 9.0, 6.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-10.6484375, -10.3214111328125, -9.994384765625, -9.6673583984375, -9.34033203125, -9.0133056640625, -8.686279296875, -8.3592529296875, -8.0322265625, -7.7052001953125, -7.378173828125, -7.0511474609375, -6.72412109375, -6.3970947265625, -6.070068359375, -5.7430419921875, -5.416015625, -5.0889892578125, -4.761962890625, -4.4349365234375, -4.10791015625, -3.7808837890625, -3.453857421875, -3.1268310546875, -2.7998046875, -2.4727783203125, -2.145751953125, -1.8187255859375, -1.49169921875, -1.1646728515625, -0.837646484375, -0.5106201171875, -0.18359375, 0.1434326171875, 0.470458984375, 0.7974853515625, 1.12451171875, 1.4515380859375, 1.778564453125, 2.1055908203125, 2.4326171875, 2.7596435546875, 3.086669921875, 3.4136962890625, 3.74072265625, 4.0677490234375, 4.394775390625, 4.7218017578125, 5.048828125, 5.3758544921875, 5.702880859375, 6.0299072265625, 6.35693359375, 6.6839599609375, 7.010986328125, 7.3380126953125, 7.6650390625, 7.9920654296875, 8.319091796875, 8.6461181640625, 8.97314453125, 9.3001708984375, 9.627197265625, 9.9542236328125, 10.28125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 4.0, 3.0, 10.0, 6.0, 14.0, 21.0, 28.0, 37.0, 47.0, 54.0, 84.0, 126.0, 141.0, 189.0, 313.0, 394.0, 469.0, 526.0, 438.0, 282.0, 218.0, 174.0, 130.0, 88.0, 68.0, 40.0, 32.0, 36.0, 25.0, 13.0, 20.0, 8.0, 11.0, 3.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2890625, -7.06890869140625, -6.8487548828125, -6.62860107421875, -6.408447265625, -6.18829345703125, -5.9681396484375, -5.74798583984375, -5.52783203125, -5.30767822265625, -5.0875244140625, -4.86737060546875, -4.647216796875, -4.42706298828125, -4.2069091796875, -3.98675537109375, -3.7666015625, -3.54644775390625, -3.3262939453125, -3.10614013671875, -2.885986328125, -2.66583251953125, -2.4456787109375, -2.22552490234375, -2.00537109375, -1.78521728515625, -1.5650634765625, -1.34490966796875, -1.124755859375, -0.90460205078125, -0.6844482421875, -0.46429443359375, -0.244140625, -0.02398681640625, 0.1961669921875, 0.41632080078125, 0.636474609375, 0.85662841796875, 1.0767822265625, 1.29693603515625, 1.51708984375, 1.73724365234375, 1.9573974609375, 2.17755126953125, 2.397705078125, 2.61785888671875, 2.8380126953125, 3.05816650390625, 3.2783203125, 3.49847412109375, 3.7186279296875, 3.93878173828125, 4.158935546875, 4.37908935546875, 4.5992431640625, 4.81939697265625, 5.03955078125, 5.25970458984375, 5.4798583984375, 5.70001220703125, 5.920166015625, 6.14031982421875, 6.3604736328125, 6.58062744140625, 6.80078125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 6.0, 4.0, 7.0, 22.0, 22.0, 24.0, 35.0, 61.0, 75.0, 76.0, 124.0, 167.0, 296.0, 625.0, 1946.0, 10812.0, 126136.0, 3245145.0, 764674.0, 37398.0, 4494.0, 1013.0, 371.0, 242.0, 132.0, 104.0, 70.0, 62.0, 40.0, 27.0, 21.0, 9.0, 6.0, 9.0, 10.0, 7.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-27.4375, -26.6484375, -25.859375, -25.0703125, -24.28125, -23.4921875, -22.703125, -21.9140625, -21.125, -20.3359375, -19.546875, -18.7578125, -17.96875, -17.1796875, -16.390625, -15.6015625, -14.8125, -14.0234375, -13.234375, -12.4453125, -11.65625, -10.8671875, -10.078125, -9.2890625, -8.5, -7.7109375, -6.921875, -6.1328125, -5.34375, -4.5546875, -3.765625, -2.9765625, -2.1875, -1.3984375, -0.609375, 0.1796875, 0.96875, 1.7578125, 2.546875, 3.3359375, 4.125, 4.9140625, 5.703125, 6.4921875, 7.28125, 8.0703125, 8.859375, 9.6484375, 10.4375, 11.2265625, 12.015625, 12.8046875, 13.59375, 14.3828125, 15.171875, 15.9609375, 16.75, 17.5390625, 18.328125, 19.1171875, 19.90625, 20.6953125, 21.484375, 22.2734375, 23.0625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 8.0, 32.0, 53.0, 72.0, 120.0, 138.0, 169.0, 143.0, 116.0, 84.0, 32.0, 32.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.169864654541016, -43.46155548095703, -41.75324249267578, -40.0449333190918, -38.33662414550781, -36.62831497192383, -34.920005798339844, -33.211692810058594, -31.50338363647461, -29.795074462890625, -28.086763381958008, -26.37845230102539, -24.670143127441406, -22.961833953857422, -21.253522872924805, -19.545211791992188, -17.836902618408203, -16.12859344482422, -14.420282363891602, -12.7119722366333, -11.003662109375, -9.2953519821167, -7.587041854858398, -5.878731727600098, -4.170421600341797, -2.462111473083496, -0.7538013458251953, 0.9545087814331055, 2.6628189086914062, 4.371129035949707, 6.079439163208008, 7.787749290466309, 9.496063232421875, 11.204373359680176, 12.912683486938477, 14.620993614196777, 16.329303741455078, 18.037612915039062, 19.74592399597168, 21.454235076904297, 23.16254425048828, 24.870853424072266, 26.579164505004883, 28.2874755859375, 29.995784759521484, 31.70409393310547, 33.41240692138672, 35.1207160949707, 36.82902526855469, 38.53733444213867, 40.245643615722656, 41.953956604003906, 43.66226577758789, 45.370574951171875, 47.078887939453125, 48.78719711303711, 50.495506286621094, 52.20381546020508, 53.91212463378906, 55.62043762207031, 57.3287467956543, 59.03705596923828, 60.74536895751953, 62.453678131103516, 64.1619873046875]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 8.0, 9.0, 9.0, 9.0, 14.0, 14.0, 14.0, 25.0, 27.0, 27.0, 37.0, 30.0, 45.0, 43.0, 29.0, 41.0, 45.0, 48.0, 45.0, 35.0, 37.0, 25.0, 34.0, 41.0, 39.0, 42.0, 33.0, 35.0, 26.0, 24.0, 19.0, 16.0, 16.0, 16.0, 10.0, 9.0, 9.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-26.46826934814453, -25.6832332611084, -24.898197174072266, -24.113161087036133, -23.328125, -22.543088912963867, -21.758052825927734, -20.973018646240234, -20.18798065185547, -19.402944564819336, -18.617908477783203, -17.83287239074707, -17.047836303710938, -16.262800216674805, -15.477765083312988, -14.692728996276855, -13.907693862915039, -13.122657775878906, -12.337621688842773, -11.55258560180664, -10.767549514770508, -9.982513427734375, -9.197478294372559, -8.412442207336426, -7.627406120300293, -6.84237003326416, -6.057333946228027, -5.272298336029053, -4.48726224899292, -3.702226161956787, -2.9171905517578125, -2.1321544647216797, -1.3471183776855469, -0.5620824098587036, 0.22295355796813965, 1.0079894065856934, 1.7930254936218262, 2.578061580657959, 3.3630971908569336, 4.148133277893066, 4.933169364929199, 5.718205451965332, 6.503241539001465, 7.2882771492004395, 8.073312759399414, 8.858348846435547, 9.64338493347168, 10.428421020507812, 11.213457107543945, 11.998493194580078, 12.783529281616211, 13.568565368652344, 14.353601455688477, 15.13863754272461, 15.923672676086426, 16.708709716796875, 17.493743896484375, 18.278779983520508, 19.06381607055664, 19.848852157592773, 20.633888244628906, 21.41892433166504, 22.203960418701172, 22.988994598388672, 23.774032592773438]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 3.0, 5.0, 7.0, 10.0, 6.0, 7.0, 8.0, 17.0, 17.0, 14.0, 23.0, 30.0, 19.0, 24.0, 43.0, 39.0, 32.0, 42.0, 35.0, 41.0, 49.0, 31.0, 37.0, 38.0, 52.0, 41.0, 31.0, 23.0, 26.0, 30.0, 36.0, 13.0, 26.0, 24.0, 21.0, 21.0, 10.0, 12.0, 11.0, 12.0, 10.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.23046875, -4.09912109375, -3.9677734375, -3.83642578125, -3.705078125, -3.57373046875, -3.4423828125, -3.31103515625, -3.1796875, -3.04833984375, -2.9169921875, -2.78564453125, -2.654296875, -2.52294921875, -2.3916015625, -2.26025390625, -2.12890625, -1.99755859375, -1.8662109375, -1.73486328125, -1.603515625, -1.47216796875, -1.3408203125, -1.20947265625, -1.078125, -0.94677734375, -0.8154296875, -0.68408203125, -0.552734375, -0.42138671875, -0.2900390625, -0.15869140625, -0.02734375, 0.10400390625, 0.2353515625, 0.36669921875, 0.498046875, 0.62939453125, 0.7607421875, 0.89208984375, 1.0234375, 1.15478515625, 1.2861328125, 1.41748046875, 1.548828125, 1.68017578125, 1.8115234375, 1.94287109375, 2.07421875, 2.20556640625, 2.3369140625, 2.46826171875, 2.599609375, 2.73095703125, 2.8623046875, 2.99365234375, 3.125, 3.25634765625, 3.3876953125, 3.51904296875, 3.650390625, 3.78173828125, 3.9130859375, 4.04443359375, 4.17578125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 10.0, 10.0, 12.0, 22.0, 32.0, 51.0, 82.0, 100.0, 125.0, 191.0, 303.0, 384.0, 527.0, 737.0, 983.0, 1392.0, 1892.0, 2514.0, 3613.0, 5082.0, 6832.0, 9726.0, 13894.0, 19892.0, 29434.0, 44154.0, 69605.0, 121809.0, 279251.0, 174394.0, 90250.0, 54712.0, 35637.0, 23615.0, 16724.0, 11356.0, 8187.0, 5752.0, 4245.0, 3070.0, 2128.0, 1635.0, 1174.0, 868.0, 583.0, 433.0, 348.0, 266.0, 157.0, 106.0, 77.0, 77.0, 37.0, 32.0, 18.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.285400390625, -0.2764091491699219, -0.26741790771484375, -0.2584266662597656, -0.2494354248046875, -0.24044418334960938, -0.23145294189453125, -0.22246170043945312, -0.213470458984375, -0.20447921752929688, -0.19548797607421875, -0.18649673461914062, -0.1775054931640625, -0.16851425170898438, -0.15952301025390625, -0.15053176879882812, -0.14154052734375, -0.13254928588867188, -0.12355804443359375, -0.11456680297851562, -0.1055755615234375, -0.09658432006835938, -0.08759307861328125, -0.07860183715820312, -0.069610595703125, -0.060619354248046875, -0.05162811279296875, -0.042636871337890625, -0.0336456298828125, -0.024654388427734375, -0.01566314697265625, -0.006671905517578125, 0.0023193359375, 0.011310577392578125, 0.02030181884765625, 0.029293060302734375, 0.0382843017578125, 0.047275543212890625, 0.05626678466796875, 0.06525802612304688, 0.074249267578125, 0.08324050903320312, 0.09223175048828125, 0.10122299194335938, 0.1102142333984375, 0.11920547485351562, 0.12819671630859375, 0.13718795776367188, 0.14617919921875, 0.15517044067382812, 0.16416168212890625, 0.17315292358398438, 0.1821441650390625, 0.19113540649414062, 0.20012664794921875, 0.20911788940429688, 0.218109130859375, 0.22710037231445312, 0.23609161376953125, 0.24508285522460938, 0.2540740966796875, 0.2630653381347656, 0.27205657958984375, 0.2810478210449219, 0.2900390625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 12.0, 12.0, 11.0, 16.0, 17.0, 27.0, 21.0, 24.0, 22.0, 34.0, 27.0, 37.0, 37.0, 35.0, 49.0, 48.0, 40.0, 1061.0, 40.0, 36.0, 48.0, 34.0, 35.0, 34.0, 32.0, 34.0, 27.0, 23.0, 21.0, 23.0, 23.0, 18.0, 8.0, 13.0, 6.0, 7.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.24609375, -3.14227294921875, -3.0384521484375, -2.93463134765625, -2.830810546875, -2.72698974609375, -2.6231689453125, -2.51934814453125, -2.41552734375, -2.31170654296875, -2.2078857421875, -2.10406494140625, -2.000244140625, -1.89642333984375, -1.7926025390625, -1.68878173828125, -1.5849609375, -1.48114013671875, -1.3773193359375, -1.27349853515625, -1.169677734375, -1.06585693359375, -0.9620361328125, -0.85821533203125, -0.75439453125, -0.65057373046875, -0.5467529296875, -0.44293212890625, -0.339111328125, -0.23529052734375, -0.1314697265625, -0.02764892578125, 0.076171875, 0.17999267578125, 0.2838134765625, 0.38763427734375, 0.491455078125, 0.59527587890625, 0.6990966796875, 0.80291748046875, 0.90673828125, 1.01055908203125, 1.1143798828125, 1.21820068359375, 1.322021484375, 1.42584228515625, 1.5296630859375, 1.63348388671875, 1.7373046875, 1.84112548828125, 1.9449462890625, 2.04876708984375, 2.152587890625, 2.25640869140625, 2.3602294921875, 2.46405029296875, 2.56787109375, 2.67169189453125, 2.7755126953125, 2.87933349609375, 2.983154296875, 3.08697509765625, 3.1907958984375, 3.29461669921875, 3.3984375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 13.0, 19.0, 12.0, 23.0, 31.0, 41.0, 66.0, 112.0, 158.0, 277.0, 391.0, 524.0, 821.0, 1284.0, 2081.0, 3147.0, 4871.0, 7945.0, 12669.0, 21111.0, 35632.0, 64504.0, 131282.0, 1416101.0, 194637.0, 85401.0, 45750.0, 26154.0, 15770.0, 9570.0, 6019.0, 3818.0, 2354.0, 1516.0, 1053.0, 690.0, 433.0, 268.0, 173.0, 128.0, 100.0, 65.0, 54.0, 16.0, 16.0, 15.0, 9.0, 3.0, 1.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.2266845703125, -0.2197551727294922, -0.21282577514648438, -0.20589637756347656, -0.19896697998046875, -0.19203758239746094, -0.18510818481445312, -0.1781787872314453, -0.1712493896484375, -0.1643199920654297, -0.15739059448242188, -0.15046119689941406, -0.14353179931640625, -0.13660240173339844, -0.12967300415039062, -0.12274360656738281, -0.115814208984375, -0.10888481140136719, -0.10195541381835938, -0.09502601623535156, -0.08809661865234375, -0.08116722106933594, -0.07423782348632812, -0.06730842590332031, -0.0603790283203125, -0.05344963073730469, -0.046520233154296875, -0.03959083557128906, -0.03266143798828125, -0.025732040405273438, -0.018802642822265625, -0.011873245239257812, -0.00494384765625, 0.0019855499267578125, 0.008914947509765625, 0.015844345092773438, 0.02277374267578125, 0.029703140258789062, 0.036632537841796875, 0.04356193542480469, 0.0504913330078125, 0.05742073059082031, 0.06435012817382812, 0.07127952575683594, 0.07820892333984375, 0.08513832092285156, 0.09206771850585938, 0.09899711608886719, 0.105926513671875, 0.11285591125488281, 0.11978530883789062, 0.12671470642089844, 0.13364410400390625, 0.14057350158691406, 0.14750289916992188, 0.1544322967529297, 0.1613616943359375, 0.1682910919189453, 0.17522048950195312, 0.18214988708496094, 0.18907928466796875, 0.19600868225097656, 0.20293807983398438, 0.2098674774169922, 0.216796875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 5.0, 4.0, 6.0, 13.0, 13.0, 14.0, 14.0, 15.0, 19.0, 28.0, 23.0, 34.0, 41.0, 45.0, 53.0, 70.0, 81.0, 81.0, 72.0, 59.0, 52.0, 31.0, 30.0, 37.0, 29.0, 18.0, 21.0, 11.0, 11.0, 11.0, 10.0, 7.0, 9.0, 6.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7000904083251953e-05, -2.6077963411808014e-05, -2.5155022740364075e-05, -2.4232082068920135e-05, -2.3309141397476196e-05, -2.2386200726032257e-05, -2.1463260054588318e-05, -2.054031938314438e-05, -1.961737871170044e-05, -1.86944380402565e-05, -1.777149736881256e-05, -1.6848556697368622e-05, -1.5925616025924683e-05, -1.5002675354480743e-05, -1.4079734683036804e-05, -1.3156794011592865e-05, -1.2233853340148926e-05, -1.1310912668704987e-05, -1.0387971997261047e-05, -9.465031325817108e-06, -8.542090654373169e-06, -7.61914998292923e-06, -6.6962093114852905e-06, -5.773268640041351e-06, -4.850327968597412e-06, -3.927387297153473e-06, -3.0044466257095337e-06, -2.0815059542655945e-06, -1.1585652828216553e-06, -2.3562461137771606e-07, 6.873160600662231e-07, 1.6102567315101624e-06, 2.5331974029541016e-06, 3.4561380743980408e-06, 4.37907874584198e-06, 5.302019417285919e-06, 6.224960088729858e-06, 7.147900760173798e-06, 8.070841431617737e-06, 8.993782103061676e-06, 9.916722774505615e-06, 1.0839663445949554e-05, 1.1762604117393494e-05, 1.2685544788837433e-05, 1.3608485460281372e-05, 1.4531426131725311e-05, 1.545436680316925e-05, 1.637730747461319e-05, 1.730024814605713e-05, 1.8223188817501068e-05, 1.9146129488945007e-05, 2.0069070160388947e-05, 2.0992010831832886e-05, 2.1914951503276825e-05, 2.2837892174720764e-05, 2.3760832846164703e-05, 2.4683773517608643e-05, 2.5606714189052582e-05, 2.652965486049652e-05, 2.745259553194046e-05, 2.83755362033844e-05, 2.929847687482834e-05, 3.0221417546272278e-05, 3.114435821771622e-05, 3.2067298889160156e-05]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 7.0, 6.0, 9.0, 17.0, 8.0, 14.0, 19.0, 31.0, 37.0, 39.0, 57.0, 86.0, 129.0, 307.0, 2735.0, 822495.0, 220217.0, 1581.0, 264.0, 125.0, 67.0, 62.0, 37.0, 37.0, 29.0, 15.0, 18.0, 15.0, 12.0, 13.0, 15.0, 5.0, 2.0, 6.0, 4.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0007119178771972656, -0.0006915256381034851, -0.0006711333990097046, -0.0006507411599159241, -0.0006303489208221436, -0.000609956681728363, -0.0005895644426345825, -0.000569172203540802, -0.0005487799644470215, -0.000528387725353241, -0.0005079954862594604, -0.00048760324716567993, -0.0004672110080718994, -0.0004468187689781189, -0.0004264265298843384, -0.00040603429079055786, -0.00038564205169677734, -0.0003652498126029968, -0.0003448575735092163, -0.0003244653344154358, -0.0003040730953216553, -0.00028368085622787476, -0.00026328861713409424, -0.00024289637804031372, -0.0002225041389465332, -0.00020211189985275269, -0.00018171966075897217, -0.00016132742166519165, -0.00014093518257141113, -0.00012054294347763062, -0.0001001507043838501, -7.975846529006958e-05, -5.936622619628906e-05, -3.8973987102508545e-05, -1.8581748008728027e-05, 1.8104910850524902e-06, 2.2202730178833008e-05, 4.2594969272613525e-05, 6.298720836639404e-05, 8.337944746017456e-05, 0.00010377168655395508, 0.0001241639256477356, 0.0001445561647415161, 0.00016494840383529663, 0.00018534064292907715, 0.00020573288202285767, 0.00022612512111663818, 0.0002465173602104187, 0.0002669095993041992, 0.00028730183839797974, 0.00030769407749176025, 0.00032808631658554077, 0.0003484785556793213, 0.0003688707947731018, 0.0003892630338668823, 0.00040965527296066284, 0.00043004751205444336, 0.0004504397511482239, 0.0004708319902420044, 0.0004912242293357849, 0.0005116164684295654, 0.000532008707523346, 0.0005524009466171265, 0.000572793185710907, 0.0005931854248046875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 5.0, 10.0, 54.0, 301.0, 437.0, 178.0, 18.0, 12.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3447019227896817e-05, -1.0921427929133642e-05, -8.395836630370468e-06, -5.870246241101995e-06, -3.3446549423388205e-06, -8.19063643575646e-07, 1.7065267456928268e-06, 4.232118953950703e-06, 6.757709343219176e-06, 9.28330064198235e-06, 1.1808891940745525e-05, 1.4334482330013998e-05, 1.6860074538271874e-05, 1.9385664927540347e-05, 2.191125531680882e-05, 2.4436847525066696e-05, 2.696243791433517e-05, 2.948802830360364e-05, 3.201362051186152e-05, 3.453921090112999e-05, 3.7064801290398464e-05, 3.9590391679666936e-05, 4.2115985706914216e-05, 4.464157609618269e-05, 4.716716648545116e-05, 4.9692756874719635e-05, 5.221834726398811e-05, 5.474394129123539e-05, 5.726953168050386e-05, 5.979512206977233e-05, 6.232071609701961e-05, 6.484630284830928e-05, 6.737189687555656e-05, 6.989749090280384e-05, 7.24230776540935e-05, 7.494867168134078e-05, 7.747425843263045e-05, 7.999985245987773e-05, 8.25254392111674e-05, 8.505103323841467e-05, 8.757662726566195e-05, 9.010222129290923e-05, 9.26278080441989e-05, 9.515340207144618e-05, 9.767898882273585e-05, 0.00010020458284998313, 0.0001027301768772304, 0.00010525576362852007, 0.00010778135037980974, 0.00011030694440705702, 0.00011283253115834668, 0.00011535812518559396, 0.00011788371193688363, 0.00012040930596413091, 0.0001229348999913782, 0.00012546048674266785, 0.00012798608804587275, 0.00013051167479716241, 0.0001330372761003673, 0.00013556286285165697, 0.00013808844960294664, 0.00014061405090615153, 0.0001431396376574412, 0.00014566522440873086, 0.00014819081116002053]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 8.0, 3.0, 13.0, 8.0, 8.0, 12.0, 11.0, 9.0, 13.0, 23.0, 23.0, 11.0, 22.0, 33.0, 36.0, 37.0, 46.0, 43.0, 58.0, 28.0, 32.0, 32.0, 45.0, 38.0, 39.0, 39.0, 37.0, 29.0, 39.0, 24.0, 25.0, 25.0, 25.0, 20.0, 13.0, 15.0, 12.0, 10.0, 16.0, 12.0, 5.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.5914440155029297e-05, -1.5432946383953094e-05, -1.4951452612876892e-05, -1.446995884180069e-05, -1.3988465070724487e-05, -1.3506971299648285e-05, -1.3025477528572083e-05, -1.254398375749588e-05, -1.2062489986419678e-05, -1.1580996215343475e-05, -1.1099502444267273e-05, -1.061800867319107e-05, -1.0136514902114868e-05, -9.655021131038666e-06, -9.173527359962463e-06, -8.692033588886261e-06, -8.210539817810059e-06, -7.729046046733856e-06, -7.247552275657654e-06, -6.766058504581451e-06, -6.284564733505249e-06, -5.803070962429047e-06, -5.321577191352844e-06, -4.840083420276642e-06, -4.3585896492004395e-06, -3.877095878124237e-06, -3.3956021070480347e-06, -2.9141083359718323e-06, -2.43261456489563e-06, -1.9511207938194275e-06, -1.469627022743225e-06, -9.881332516670227e-07, -5.066394805908203e-07, -2.514570951461792e-08, 4.5634806156158447e-07, 9.378418326377869e-07, 1.4193356037139893e-06, 1.9008293747901917e-06, 2.382323145866394e-06, 2.8638169169425964e-06, 3.345310688018799e-06, 3.826804459095001e-06, 4.308298230171204e-06, 4.789792001247406e-06, 5.271285772323608e-06, 5.752779543399811e-06, 6.234273314476013e-06, 6.7157670855522156e-06, 7.197260856628418e-06, 7.67875462770462e-06, 8.160248398780823e-06, 8.641742169857025e-06, 9.123235940933228e-06, 9.60472971200943e-06, 1.0086223483085632e-05, 1.0567717254161835e-05, 1.1049211025238037e-05, 1.153070479631424e-05, 1.2012198567390442e-05, 1.2493692338466644e-05, 1.2975186109542847e-05, 1.3456679880619049e-05, 1.3938173651695251e-05, 1.4419667422771454e-05, 1.4901161193847656e-05]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 3.0, 5.0, 7.0, 10.0, 6.0, 7.0, 8.0, 17.0, 17.0, 14.0, 23.0, 30.0, 19.0, 24.0, 43.0, 39.0, 32.0, 42.0, 35.0, 41.0, 49.0, 31.0, 37.0, 38.0, 52.0, 41.0, 31.0, 23.0, 26.0, 30.0, 36.0, 13.0, 26.0, 24.0, 21.0, 21.0, 10.0, 12.0, 11.0, 12.0, 10.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.23046875, -4.09912109375, -3.9677734375, -3.83642578125, -3.705078125, -3.57373046875, -3.4423828125, -3.31103515625, -3.1796875, -3.04833984375, -2.9169921875, -2.78564453125, -2.654296875, -2.52294921875, -2.3916015625, -2.26025390625, -2.12890625, -1.99755859375, -1.8662109375, -1.73486328125, -1.603515625, -1.47216796875, -1.3408203125, -1.20947265625, -1.078125, -0.94677734375, -0.8154296875, -0.68408203125, -0.552734375, -0.42138671875, -0.2900390625, -0.15869140625, -0.02734375, 0.10400390625, 0.2353515625, 0.36669921875, 0.498046875, 0.62939453125, 0.7607421875, 0.89208984375, 1.0234375, 1.15478515625, 1.2861328125, 1.41748046875, 1.548828125, 1.68017578125, 1.8115234375, 1.94287109375, 2.07421875, 2.20556640625, 2.3369140625, 2.46826171875, 2.599609375, 2.73095703125, 2.8623046875, 2.99365234375, 3.125, 3.25634765625, 3.3876953125, 3.51904296875, 3.650390625, 3.78173828125, 3.9130859375, 4.04443359375, 4.17578125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 11.0, 10.0, 7.0, 5.0, 15.0, 24.0, 34.0, 43.0, 65.0, 82.0, 131.0, 182.0, 270.0, 413.0, 687.0, 1202.0, 1881.0, 3266.0, 5720.0, 10366.0, 19557.0, 42236.0, 109940.0, 315269.0, 329968.0, 117271.0, 44371.0, 20429.0, 10637.0, 5891.0, 3336.0, 2022.0, 1131.0, 720.0, 440.0, 311.0, 168.0, 144.0, 83.0, 62.0, 43.0, 37.0, 25.0, 15.0, 10.0, 13.0, 5.0, 7.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.45703125, -5.26904296875, -5.0810546875, -4.89306640625, -4.705078125, -4.51708984375, -4.3291015625, -4.14111328125, -3.953125, -3.76513671875, -3.5771484375, -3.38916015625, -3.201171875, -3.01318359375, -2.8251953125, -2.63720703125, -2.44921875, -2.26123046875, -2.0732421875, -1.88525390625, -1.697265625, -1.50927734375, -1.3212890625, -1.13330078125, -0.9453125, -0.75732421875, -0.5693359375, -0.38134765625, -0.193359375, -0.00537109375, 0.1826171875, 0.37060546875, 0.55859375, 0.74658203125, 0.9345703125, 1.12255859375, 1.310546875, 1.49853515625, 1.6865234375, 1.87451171875, 2.0625, 2.25048828125, 2.4384765625, 2.62646484375, 2.814453125, 3.00244140625, 3.1904296875, 3.37841796875, 3.56640625, 3.75439453125, 3.9423828125, 4.13037109375, 4.318359375, 4.50634765625, 4.6943359375, 4.88232421875, 5.0703125, 5.25830078125, 5.4462890625, 5.63427734375, 5.822265625, 6.01025390625, 6.1982421875, 6.38623046875, 6.57421875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 10.0, 4.0, 12.0, 23.0, 10.0, 14.0, 17.0, 28.0, 14.0, 26.0, 28.0, 33.0, 33.0, 36.0, 48.0, 69.0, 71.0, 117.0, 283.0, 1459.0, 193.0, 88.0, 70.0, 52.0, 30.0, 38.0, 31.0, 35.0, 30.0, 10.0, 17.0, 19.0, 19.0, 13.0, 13.0, 6.0, 13.0, 8.0, 6.0, 3.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.7265625, -12.306396484375, -11.88623046875, -11.466064453125, -11.0458984375, -10.625732421875, -10.20556640625, -9.785400390625, -9.365234375, -8.945068359375, -8.52490234375, -8.104736328125, -7.6845703125, -7.264404296875, -6.84423828125, -6.424072265625, -6.00390625, -5.583740234375, -5.16357421875, -4.743408203125, -4.3232421875, -3.903076171875, -3.48291015625, -3.062744140625, -2.642578125, -2.222412109375, -1.80224609375, -1.382080078125, -0.9619140625, -0.541748046875, -0.12158203125, 0.298583984375, 0.71875, 1.138916015625, 1.55908203125, 1.979248046875, 2.3994140625, 2.819580078125, 3.23974609375, 3.659912109375, 4.080078125, 4.500244140625, 4.92041015625, 5.340576171875, 5.7607421875, 6.180908203125, 6.60107421875, 7.021240234375, 7.44140625, 7.861572265625, 8.28173828125, 8.701904296875, 9.1220703125, 9.542236328125, 9.96240234375, 10.382568359375, 10.802734375, 11.222900390625, 11.64306640625, 12.063232421875, 12.4833984375, 12.903564453125, 13.32373046875, 13.743896484375, 14.1640625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 10.0, 2.0, 4.0, 9.0, 12.0, 12.0, 15.0, 22.0, 19.0, 28.0, 29.0, 40.0, 42.0, 62.0, 82.0, 116.0, 192.0, 316.0, 871.0, 3986.0, 24894.0, 404787.0, 2599849.0, 96266.0, 10558.0, 1994.0, 606.0, 244.0, 144.0, 115.0, 72.0, 66.0, 46.0, 39.0, 41.0, 21.0, 18.0, 17.0, 19.0, 12.0, 9.0, 10.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-19.703125, -19.12841796875, -18.5537109375, -17.97900390625, -17.404296875, -16.82958984375, -16.2548828125, -15.68017578125, -15.10546875, -14.53076171875, -13.9560546875, -13.38134765625, -12.806640625, -12.23193359375, -11.6572265625, -11.08251953125, -10.5078125, -9.93310546875, -9.3583984375, -8.78369140625, -8.208984375, -7.63427734375, -7.0595703125, -6.48486328125, -5.91015625, -5.33544921875, -4.7607421875, -4.18603515625, -3.611328125, -3.03662109375, -2.4619140625, -1.88720703125, -1.3125, -0.73779296875, -0.1630859375, 0.41162109375, 0.986328125, 1.56103515625, 2.1357421875, 2.71044921875, 3.28515625, 3.85986328125, 4.4345703125, 5.00927734375, 5.583984375, 6.15869140625, 6.7333984375, 7.30810546875, 7.8828125, 8.45751953125, 9.0322265625, 9.60693359375, 10.181640625, 10.75634765625, 11.3310546875, 11.90576171875, 12.48046875, 13.05517578125, 13.6298828125, 14.20458984375, 14.779296875, 15.35400390625, 15.9287109375, 16.50341796875, 17.078125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 12.0, 28.0, 60.0, 83.0, 104.0, 170.0, 159.0, 125.0, 92.0, 85.0, 38.0, 21.0, 16.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.852945327758789, -10.896310806274414, -9.939676284790039, -8.983041763305664, -8.026407241821289, -7.069773197174072, -6.1131391525268555, -5.1565046310424805, -4.1998701095581055, -3.2432355880737305, -2.2866013050079346, -1.3299670219421387, -0.37333250045776367, 0.5833020210266113, 1.5399360656738281, 2.496570587158203, 3.453205108642578, 4.409839630126953, 5.366474151611328, 6.323108196258545, 7.27974271774292, 8.236377716064453, 9.193011283874512, 10.149645805358887, 11.106280326843262, 12.062914848327637, 13.019549369812012, 13.97618293762207, 14.932817459106445, 15.88945198059082, 16.846086502075195, 17.80272102355957, 18.759357452392578, 19.715991973876953, 20.672626495361328, 21.629261016845703, 22.585895538330078, 23.542530059814453, 24.499164581298828, 25.455799102783203, 26.412433624267578, 27.369068145751953, 28.325702667236328, 29.282337188720703, 30.238971710205078, 31.195606231689453, 32.15224075317383, 33.1088752746582, 34.06550598144531, 35.02214050292969, 35.97877502441406, 36.93540954589844, 37.89204406738281, 38.84867858886719, 39.80531311035156, 40.76194763183594, 41.71858215332031, 42.67521667480469, 43.63185119628906, 44.58848571777344, 45.54512023925781, 46.50175476074219, 47.45838928222656, 48.41502380371094, 49.37165832519531]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 5.0, 6.0, 5.0, 4.0, 12.0, 5.0, 8.0, 19.0, 18.0, 14.0, 24.0, 31.0, 35.0, 31.0, 33.0, 26.0, 37.0, 30.0, 41.0, 50.0, 41.0, 37.0, 46.0, 34.0, 41.0, 27.0, 30.0, 30.0, 34.0, 22.0, 34.0, 22.0, 26.0, 23.0, 16.0, 11.0, 19.0, 14.0, 6.0, 9.0, 9.0, 3.0, 5.0, 7.0, 8.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-35.807655334472656, -34.699684143066406, -33.591712951660156, -32.483741760253906, -31.37577247619629, -30.26780128479004, -29.159832000732422, -28.051860809326172, -26.943889617919922, -25.835918426513672, -24.727947235107422, -23.619977951049805, -22.512006759643555, -21.404035568237305, -20.296066284179688, -19.188095092773438, -18.080123901367188, -16.972152709960938, -15.864182472229004, -14.75621223449707, -13.64824104309082, -12.54026985168457, -11.432299613952637, -10.324329376220703, -9.216358184814453, -8.108386993408203, -7.0004167556762695, -5.892446041107178, -4.784475326538086, -3.676504611968994, -2.5685338973999023, -1.4605631828308105, -0.35259246826171875, 0.755378246307373, 1.8633489608764648, 2.9713196754455566, 4.079290390014648, 5.18726110458374, 6.295231819152832, 7.403202533721924, 8.511173248291016, 9.619144439697266, 10.7271146774292, 11.835084915161133, 12.943056106567383, 14.051027297973633, 15.158997535705566, 16.2669677734375, 17.37493896484375, 18.48291015625, 19.59088134765625, 20.698850631713867, 21.806821823120117, 22.914793014526367, 24.022762298583984, 25.130733489990234, 26.238704681396484, 27.346675872802734, 28.454647064208984, 29.5626163482666, 30.67058753967285, 31.7785587310791, 32.88652801513672, 33.99449920654297, 35.10247039794922]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 0.0, 7.0, 1.0, 4.0, 8.0, 7.0, 11.0, 17.0, 14.0, 10.0, 15.0, 19.0, 19.0, 30.0, 27.0, 35.0, 28.0, 42.0, 38.0, 33.0, 50.0, 49.0, 37.0, 47.0, 29.0, 45.0, 34.0, 34.0, 34.0, 34.0, 27.0, 25.0, 27.0, 24.0, 16.0, 21.0, 25.0, 13.0, 16.0, 11.0, 12.0, 3.0, 4.0, 6.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.484375, -4.34564208984375, -4.2069091796875, -4.06817626953125, -3.929443359375, -3.79071044921875, -3.6519775390625, -3.51324462890625, -3.37451171875, -3.23577880859375, -3.0970458984375, -2.95831298828125, -2.819580078125, -2.68084716796875, -2.5421142578125, -2.40338134765625, -2.2646484375, -2.12591552734375, -1.9871826171875, -1.84844970703125, -1.709716796875, -1.57098388671875, -1.4322509765625, -1.29351806640625, -1.15478515625, -1.01605224609375, -0.8773193359375, -0.73858642578125, -0.599853515625, -0.46112060546875, -0.3223876953125, -0.18365478515625, -0.044921875, 0.09381103515625, 0.2325439453125, 0.37127685546875, 0.510009765625, 0.64874267578125, 0.7874755859375, 0.92620849609375, 1.06494140625, 1.20367431640625, 1.3424072265625, 1.48114013671875, 1.619873046875, 1.75860595703125, 1.8973388671875, 2.03607177734375, 2.1748046875, 2.31353759765625, 2.4522705078125, 2.59100341796875, 2.729736328125, 2.86846923828125, 3.0072021484375, 3.14593505859375, 3.28466796875, 3.42340087890625, 3.5621337890625, 3.70086669921875, 3.839599609375, 3.97833251953125, 4.1170654296875, 4.25579833984375, 4.39453125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 6.0, 7.0, 9.0, 14.0, 13.0, 24.0, 39.0, 34.0, 59.0, 70.0, 124.0, 151.0, 270.0, 406.0, 687.0, 1169.0, 2229.0, 4376.0, 9342.0, 23015.0, 64632.0, 233723.0, 1180652.0, 2051873.0, 452583.0, 108382.0, 35154.0, 13260.0, 5641.0, 2734.0, 1442.0, 811.0, 460.0, 293.0, 198.0, 104.0, 77.0, 54.0, 43.0, 33.0, 24.0, 16.0, 11.0, 14.0, 6.0, 2.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.58984375, -7.3466796875, -7.103515625, -6.8603515625, -6.6171875, -6.3740234375, -6.130859375, -5.8876953125, -5.64453125, -5.4013671875, -5.158203125, -4.9150390625, -4.671875, -4.4287109375, -4.185546875, -3.9423828125, -3.69921875, -3.4560546875, -3.212890625, -2.9697265625, -2.7265625, -2.4833984375, -2.240234375, -1.9970703125, -1.75390625, -1.5107421875, -1.267578125, -1.0244140625, -0.78125, -0.5380859375, -0.294921875, -0.0517578125, 0.19140625, 0.4345703125, 0.677734375, 0.9208984375, 1.1640625, 1.4072265625, 1.650390625, 1.8935546875, 2.13671875, 2.3798828125, 2.623046875, 2.8662109375, 3.109375, 3.3525390625, 3.595703125, 3.8388671875, 4.08203125, 4.3251953125, 4.568359375, 4.8115234375, 5.0546875, 5.2978515625, 5.541015625, 5.7841796875, 6.02734375, 6.2705078125, 6.513671875, 6.7568359375, 7.0, 7.2431640625, 7.486328125, 7.7294921875, 7.97265625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 6.0, 12.0, 12.0, 20.0, 22.0, 33.0, 34.0, 47.0, 58.0, 77.0, 100.0, 140.0, 189.0, 252.0, 330.0, 450.0, 504.0, 444.0, 304.0, 225.0, 191.0, 143.0, 101.0, 95.0, 61.0, 50.0, 46.0, 25.0, 13.0, 15.0, 19.0, 5.0, 13.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.35546875, -7.14166259765625, -6.9278564453125, -6.71405029296875, -6.500244140625, -6.28643798828125, -6.0726318359375, -5.85882568359375, -5.64501953125, -5.43121337890625, -5.2174072265625, -5.00360107421875, -4.789794921875, -4.57598876953125, -4.3621826171875, -4.14837646484375, -3.9345703125, -3.72076416015625, -3.5069580078125, -3.29315185546875, -3.079345703125, -2.86553955078125, -2.6517333984375, -2.43792724609375, -2.22412109375, -2.01031494140625, -1.7965087890625, -1.58270263671875, -1.368896484375, -1.15509033203125, -0.9412841796875, -0.72747802734375, -0.513671875, -0.29986572265625, -0.0860595703125, 0.12774658203125, 0.341552734375, 0.55535888671875, 0.7691650390625, 0.98297119140625, 1.19677734375, 1.41058349609375, 1.6243896484375, 1.83819580078125, 2.052001953125, 2.26580810546875, 2.4796142578125, 2.69342041015625, 2.9072265625, 3.12103271484375, 3.3348388671875, 3.54864501953125, 3.762451171875, 3.97625732421875, 4.1900634765625, 4.40386962890625, 4.61767578125, 4.83148193359375, 5.0452880859375, 5.25909423828125, 5.472900390625, 5.68670654296875, 5.9005126953125, 6.11431884765625, 6.328125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 8.0, 5.0, 19.0, 18.0, 33.0, 36.0, 72.0, 74.0, 112.0, 177.0, 376.0, 992.0, 4513.0, 35377.0, 642236.0, 3340255.0, 153114.0, 13460.0, 2135.0, 574.0, 238.0, 151.0, 89.0, 65.0, 45.0, 33.0, 19.0, 23.0, 12.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.265625, -21.478271484375, -20.69091796875, -19.903564453125, -19.1162109375, -18.328857421875, -17.54150390625, -16.754150390625, -15.966796875, -15.179443359375, -14.39208984375, -13.604736328125, -12.8173828125, -12.030029296875, -11.24267578125, -10.455322265625, -9.66796875, -8.880615234375, -8.09326171875, -7.305908203125, -6.5185546875, -5.731201171875, -4.94384765625, -4.156494140625, -3.369140625, -2.581787109375, -1.79443359375, -1.007080078125, -0.2197265625, 0.567626953125, 1.35498046875, 2.142333984375, 2.9296875, 3.717041015625, 4.50439453125, 5.291748046875, 6.0791015625, 6.866455078125, 7.65380859375, 8.441162109375, 9.228515625, 10.015869140625, 10.80322265625, 11.590576171875, 12.3779296875, 13.165283203125, 13.95263671875, 14.739990234375, 15.52734375, 16.314697265625, 17.10205078125, 17.889404296875, 18.6767578125, 19.464111328125, 20.25146484375, 21.038818359375, 21.826171875, 22.613525390625, 23.40087890625, 24.188232421875, 24.9755859375, 25.762939453125, 26.55029296875, 27.337646484375, 28.125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 14.0, 16.0, 28.0, 81.0, 97.0, 129.0, 162.0, 133.0, 136.0, 95.0, 58.0, 29.0, 13.0, 5.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.72816848754883, -58.053497314453125, -56.37882614135742, -54.70415496826172, -53.02947998046875, -51.35480880737305, -49.680137634277344, -48.00546646118164, -46.33079528808594, -44.656124114990234, -42.98145294189453, -41.30677795410156, -39.63210678100586, -37.957435607910156, -36.28276443481445, -34.60809326171875, -32.93341827392578, -31.258747100830078, -29.584074020385742, -27.90940284729004, -26.234729766845703, -24.56005859375, -22.885387420654297, -21.210716247558594, -19.536043167114258, -17.861371994018555, -16.18669891357422, -14.512027740478516, -12.837355613708496, -11.162683486938477, -9.488012313842773, -7.813340187072754, -6.138668060302734, -4.463995933532715, -2.7893242835998535, -1.1146526336669922, 0.5600194931030273, 2.234691619873047, 3.90936279296875, 5.5840349197387695, 7.258707046508789, 8.933379173278809, 10.608051300048828, 12.282722473144531, 13.95739459991455, 15.63206672668457, 17.306737899780273, 18.98141098022461, 20.656082153320312, 22.330753326416016, 24.00542640686035, 25.680097579956055, 27.35477066040039, 29.029441833496094, 30.704113006591797, 32.3787841796875, 34.05345916748047, 35.72813034057617, 37.402801513671875, 39.077476501464844, 40.75214767456055, 42.42681884765625, 44.10149002075195, 45.776161193847656, 47.45083236694336]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 6.0, 8.0, 12.0, 9.0, 9.0, 16.0, 13.0, 22.0, 20.0, 25.0, 35.0, 34.0, 28.0, 34.0, 42.0, 31.0, 41.0, 45.0, 57.0, 46.0, 43.0, 46.0, 36.0, 45.0, 31.0, 34.0, 36.0, 31.0, 20.0, 23.0, 30.0, 20.0, 14.0, 14.0, 13.0, 5.0, 5.0, 2.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.53095245361328, -23.646648406982422, -22.762346267700195, -21.87804412841797, -20.99374008178711, -20.10943603515625, -19.225133895874023, -18.340831756591797, -17.456527709960938, -16.572223663330078, -15.687921524047852, -14.803618431091309, -13.919315338134766, -13.035012245178223, -12.15070915222168, -11.266406059265137, -10.382102966308594, -9.49779987335205, -8.613496780395508, -7.729193687438965, -6.844890594482422, -5.960587501525879, -5.076284408569336, -4.191981315612793, -3.30767822265625, -2.423375129699707, -1.539072036743164, -0.6547689437866211, 0.22953414916992188, 1.1138372421264648, 1.9981403350830078, 2.882443428039551, 3.7667465209960938, 4.651049613952637, 5.53535270690918, 6.419655799865723, 7.303958892822266, 8.188261985778809, 9.072565078735352, 9.956868171691895, 10.841171264648438, 11.72547435760498, 12.609777450561523, 13.494080543518066, 14.37838363647461, 15.262686729431152, 16.146989822387695, 17.031291961669922, 17.91559600830078, 18.79990005493164, 19.684202194213867, 20.568504333496094, 21.452808380126953, 22.337112426757812, 23.22141456604004, 24.105716705322266, 24.990020751953125, 25.874324798583984, 26.75862693786621, 27.642929077148438, 28.527233123779297, 29.411537170410156, 30.295839309692383, 31.18014144897461, 32.06444549560547]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 3.0, 8.0, 6.0, 11.0, 8.0, 10.0, 12.0, 23.0, 15.0, 17.0, 27.0, 19.0, 31.0, 30.0, 27.0, 49.0, 43.0, 49.0, 25.0, 52.0, 45.0, 41.0, 47.0, 47.0, 32.0, 41.0, 33.0, 28.0, 26.0, 33.0, 21.0, 28.0, 14.0, 13.0, 14.0, 17.0, 11.0, 8.0, 5.0, 7.0, 9.0, 3.0, 5.0, 6.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.27203369140625, -4.1300048828125, -3.98797607421875, -3.845947265625, -3.70391845703125, -3.5618896484375, -3.41986083984375, -3.27783203125, -3.13580322265625, -2.9937744140625, -2.85174560546875, -2.709716796875, -2.56768798828125, -2.4256591796875, -2.28363037109375, -2.1416015625, -1.99957275390625, -1.8575439453125, -1.71551513671875, -1.573486328125, -1.43145751953125, -1.2894287109375, -1.14739990234375, -1.00537109375, -0.86334228515625, -0.7213134765625, -0.57928466796875, -0.437255859375, -0.29522705078125, -0.1531982421875, -0.01116943359375, 0.130859375, 0.27288818359375, 0.4149169921875, 0.55694580078125, 0.698974609375, 0.84100341796875, 0.9830322265625, 1.12506103515625, 1.26708984375, 1.40911865234375, 1.5511474609375, 1.69317626953125, 1.835205078125, 1.97723388671875, 2.1192626953125, 2.26129150390625, 2.4033203125, 2.54534912109375, 2.6873779296875, 2.82940673828125, 2.971435546875, 3.11346435546875, 3.2554931640625, 3.39752197265625, 3.53955078125, 3.68157958984375, 3.8236083984375, 3.96563720703125, 4.107666015625, 4.24969482421875, 4.3917236328125, 4.53375244140625, 4.67578125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 10.0, 14.0, 22.0, 41.0, 53.0, 76.0, 120.0, 172.0, 273.0, 414.0, 666.0, 974.0, 1593.0, 2552.0, 3962.0, 6351.0, 10278.0, 16434.0, 27811.0, 47606.0, 89186.0, 209894.0, 360437.0, 120717.0, 61064.0, 34304.0, 20244.0, 12347.0, 7645.0, 4780.0, 2974.0, 1945.0, 1255.0, 793.0, 533.0, 328.0, 221.0, 151.0, 99.0, 62.0, 41.0, 45.0, 17.0, 14.0, 14.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.422119140625, -0.40859222412109375, -0.3950653076171875, -0.38153839111328125, -0.368011474609375, -0.35448455810546875, -0.3409576416015625, -0.32743072509765625, -0.31390380859375, -0.30037689208984375, -0.2868499755859375, -0.27332305908203125, -0.259796142578125, -0.24626922607421875, -0.2327423095703125, -0.21921539306640625, -0.2056884765625, -0.19216156005859375, -0.1786346435546875, -0.16510772705078125, -0.151580810546875, -0.13805389404296875, -0.1245269775390625, -0.11100006103515625, -0.09747314453125, -0.08394622802734375, -0.0704193115234375, -0.05689239501953125, -0.043365478515625, -0.02983856201171875, -0.0163116455078125, -0.00278472900390625, 0.0107421875, 0.02426910400390625, 0.0377960205078125, 0.05132293701171875, 0.064849853515625, 0.07837677001953125, 0.0919036865234375, 0.10543060302734375, 0.11895751953125, 0.13248443603515625, 0.1460113525390625, 0.15953826904296875, 0.173065185546875, 0.18659210205078125, 0.2001190185546875, 0.21364593505859375, 0.2271728515625, 0.24069976806640625, 0.2542266845703125, 0.26775360107421875, 0.281280517578125, 0.29480743408203125, 0.3083343505859375, 0.32186126708984375, 0.33538818359375, 0.34891510009765625, 0.3624420166015625, 0.37596893310546875, 0.389495849609375, 0.40302276611328125, 0.4165496826171875, 0.43007659912109375, 0.443603515625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 3.0, 8.0, 9.0, 9.0, 8.0, 10.0, 11.0, 19.0, 20.0, 19.0, 26.0, 27.0, 35.0, 30.0, 31.0, 37.0, 36.0, 39.0, 46.0, 42.0, 43.0, 1058.0, 38.0, 37.0, 44.0, 41.0, 28.0, 34.0, 37.0, 28.0, 22.0, 28.0, 18.0, 20.0, 16.0, 13.0, 10.0, 14.0, 4.0, 7.0, 6.0, 4.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.162109375, -3.06060791015625, -2.9591064453125, -2.85760498046875, -2.756103515625, -2.65460205078125, -2.5531005859375, -2.45159912109375, -2.35009765625, -2.24859619140625, -2.1470947265625, -2.04559326171875, -1.944091796875, -1.84259033203125, -1.7410888671875, -1.63958740234375, -1.5380859375, -1.43658447265625, -1.3350830078125, -1.23358154296875, -1.132080078125, -1.03057861328125, -0.9290771484375, -0.82757568359375, -0.72607421875, -0.62457275390625, -0.5230712890625, -0.42156982421875, -0.320068359375, -0.21856689453125, -0.1170654296875, -0.01556396484375, 0.0859375, 0.18743896484375, 0.2889404296875, 0.39044189453125, 0.491943359375, 0.59344482421875, 0.6949462890625, 0.79644775390625, 0.89794921875, 0.99945068359375, 1.1009521484375, 1.20245361328125, 1.303955078125, 1.40545654296875, 1.5069580078125, 1.60845947265625, 1.7099609375, 1.81146240234375, 1.9129638671875, 2.01446533203125, 2.115966796875, 2.21746826171875, 2.3189697265625, 2.42047119140625, 2.52197265625, 2.62347412109375, 2.7249755859375, 2.82647705078125, 2.927978515625, 3.02947998046875, 3.1309814453125, 3.23248291015625, 3.333984375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 5.0, 4.0, 10.0, 11.0, 26.0, 40.0, 39.0, 67.0, 84.0, 157.0, 202.0, 273.0, 405.0, 621.0, 940.0, 1278.0, 2052.0, 2980.0, 4750.0, 7178.0, 11741.0, 19002.0, 31853.0, 56778.0, 109615.0, 1352363.0, 260033.0, 101995.0, 53056.0, 30103.0, 18008.0, 11062.0, 7098.0, 4466.0, 2892.0, 1965.0, 1267.0, 835.0, 609.0, 400.0, 277.0, 183.0, 149.0, 81.0, 50.0, 37.0, 30.0, 26.0, 15.0, 8.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.222900390625, -0.21613502502441406, -0.20936965942382812, -0.2026042938232422, -0.19583892822265625, -0.1890735626220703, -0.18230819702148438, -0.17554283142089844, -0.1687774658203125, -0.16201210021972656, -0.15524673461914062, -0.1484813690185547, -0.14171600341796875, -0.1349506378173828, -0.12818527221679688, -0.12141990661621094, -0.114654541015625, -0.10788917541503906, -0.10112380981445312, -0.09435844421386719, -0.08759307861328125, -0.08082771301269531, -0.07406234741210938, -0.06729698181152344, -0.0605316162109375, -0.05376625061035156, -0.047000885009765625, -0.04023551940917969, -0.03347015380859375, -0.026704788208007812, -0.019939422607421875, -0.013174057006835938, -0.00640869140625, 0.0003566741943359375, 0.007122039794921875, 0.013887405395507812, 0.02065277099609375, 0.027418136596679688, 0.034183502197265625, 0.04094886779785156, 0.0477142333984375, 0.05447959899902344, 0.061244964599609375, 0.06801033020019531, 0.07477569580078125, 0.08154106140136719, 0.08830642700195312, 0.09507179260253906, 0.101837158203125, 0.10860252380371094, 0.11536788940429688, 0.12213325500488281, 0.12889862060546875, 0.1356639862060547, 0.14242935180664062, 0.14919471740722656, 0.1559600830078125, 0.16272544860839844, 0.16949081420898438, 0.1762561798095703, 0.18302154541015625, 0.1897869110107422, 0.19655227661132812, 0.20331764221191406, 0.2100830078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 4.0, 8.0, 18.0, 17.0, 19.0, 16.0, 19.0, 39.0, 30.0, 46.0, 61.0, 78.0, 101.0, 111.0, 79.0, 66.0, 51.0, 44.0, 32.0, 27.0, 18.0, 25.0, 13.0, 12.0, 11.0, 7.0, 5.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.713369369506836e-05, -3.594439476728439e-05, -3.475509583950043e-05, -3.356579691171646e-05, -3.2376497983932495e-05, -3.118719905614853e-05, -2.9997900128364563e-05, -2.8808601200580597e-05, -2.761930227279663e-05, -2.6430003345012665e-05, -2.52407044172287e-05, -2.4051405489444733e-05, -2.2862106561660767e-05, -2.16728076338768e-05, -2.0483508706092834e-05, -1.929420977830887e-05, -1.8104910850524902e-05, -1.6915611922740936e-05, -1.572631299495697e-05, -1.4537014067173004e-05, -1.3347715139389038e-05, -1.2158416211605072e-05, -1.0969117283821106e-05, -9.77981835603714e-06, -8.590519428253174e-06, -7.401220500469208e-06, -6.211921572685242e-06, -5.022622644901276e-06, -3.8333237171173096e-06, -2.6440247893333435e-06, -1.4547258615493774e-06, -2.654269337654114e-07, 9.238719940185547e-07, 2.1131709218025208e-06, 3.302469849586487e-06, 4.491768777370453e-06, 5.681067705154419e-06, 6.870366632938385e-06, 8.059665560722351e-06, 9.248964488506317e-06, 1.0438263416290283e-05, 1.162756234407425e-05, 1.2816861271858215e-05, 1.4006160199642181e-05, 1.5195459127426147e-05, 1.6384758055210114e-05, 1.757405698299408e-05, 1.8763355910778046e-05, 1.9952654838562012e-05, 2.1141953766345978e-05, 2.2331252694129944e-05, 2.352055162191391e-05, 2.4709850549697876e-05, 2.5899149477481842e-05, 2.7088448405265808e-05, 2.8277747333049774e-05, 2.946704626083374e-05, 3.0656345188617706e-05, 3.184564411640167e-05, 3.303494304418564e-05, 3.4224241971969604e-05, 3.541354089975357e-05, 3.660283982753754e-05, 3.77921387553215e-05, 3.898143768310547e-05]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 6.0, 7.0, 8.0, 5.0, 10.0, 13.0, 19.0, 29.0, 35.0, 45.0, 69.0, 150.0, 295.0, 3270.0, 1022718.0, 20998.0, 417.0, 173.0, 85.0, 45.0, 37.0, 22.0, 21.0, 18.0, 13.0, 12.0, 9.0, 4.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009512901306152344, -0.0009221509099006653, -0.0008930116891860962, -0.0008638724684715271, -0.000834733247756958, -0.0008055940270423889, -0.0007764548063278198, -0.0007473155856132507, -0.0007181763648986816, -0.0006890371441841125, -0.0006598979234695435, -0.0006307587027549744, -0.0006016194820404053, -0.0005724802613258362, -0.0005433410406112671, -0.000514201819896698, -0.0004850625991821289, -0.0004559233784675598, -0.0004267841577529907, -0.00039764493703842163, -0.00036850571632385254, -0.00033936649560928345, -0.00031022727489471436, -0.00028108805418014526, -0.00025194883346557617, -0.00022280961275100708, -0.000193670392036438, -0.0001645311713218689, -0.0001353919506072998, -0.00010625272989273071, -7.711350917816162e-05, -4.797428846359253e-05, -1.8835067749023438e-05, 1.0304152965545654e-05, 3.9443373680114746e-05, 6.858259439468384e-05, 9.772181510925293e-05, 0.00012686103582382202, 0.0001560002565383911, 0.0001851394772529602, 0.0002142786979675293, 0.0002434179186820984, 0.0002725571393966675, 0.00030169636011123657, 0.00033083558082580566, 0.00035997480154037476, 0.00038911402225494385, 0.00041825324296951294, 0.00044739246368408203, 0.0004765316843986511, 0.0005056709051132202, 0.0005348101258277893, 0.0005639493465423584, 0.0005930885672569275, 0.0006222277879714966, 0.0006513670086860657, 0.0006805062294006348, 0.0007096454501152039, 0.000738784670829773, 0.000767923891544342, 0.0007970631122589111, 0.0008262023329734802, 0.0008553415536880493, 0.0008844807744026184, 0.0009136199951171875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 9.0, 25.0, 45.0, 79.0, 121.0, 183.0, 182.0, 146.0, 89.0, 54.0, 23.0, 24.0, 10.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5303618056350388e-05, -1.4302251656772569e-05, -1.330088525719475e-05, -1.2299518857616931e-05, -1.1298152458039112e-05, -1.0296786058461294e-05, -9.295418749388773e-06, -8.294052349810954e-06, -7.292685950233135e-06, -6.2913195506553166e-06, -5.289953151077498e-06, -4.288586296752328e-06, -3.2872198971745092e-06, -2.2858534975966904e-06, -1.2844866432715207e-06, -2.831202436937019e-07, 7.182461558841169e-07, 1.7196126691487734e-06, 2.72097918241343e-06, 3.722345809364924e-06, 4.723712208942743e-06, 5.725078608520562e-06, 6.7264454628457315e-06, 7.72781186242355e-06, 8.729178262001369e-06, 9.730544661579188e-06, 1.0731911061157007e-05, 1.1733278370229527e-05, 1.2734644769807346e-05, 1.3736011169385165e-05, 1.4737377568962984e-05, 1.5738743968540803e-05, 1.6740112187108025e-05, 1.7741478586685844e-05, 1.8742844986263663e-05, 1.974421138584148e-05, 2.07455777854193e-05, 2.174694418499712e-05, 2.2748310584574938e-05, 2.374967880314216e-05, 2.4751043383730575e-05, 2.5752409783308394e-05, 2.6753776182886213e-05, 2.7755142582464032e-05, 2.875650898204185e-05, 2.975787538161967e-05, 3.075924178119749e-05, 3.176060999976471e-05, 3.276197821833193e-05, 3.3763346436899155e-05, 3.476471101748757e-05, 3.576607923605479e-05, 3.676744381664321e-05, 3.776881203521043e-05, 3.8770176615798846e-05, 3.977154483436607e-05, 4.0772909414954484e-05, 4.1774277633521706e-05, 4.277564221411012e-05, 4.3777010432677343e-05, 4.477837501326576e-05, 4.577974323183298e-05, 4.6781107812421396e-05, 4.778247603098862e-05, 4.8783840611577034e-05]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 7.0, 4.0, 3.0, 5.0, 7.0, 5.0, 12.0, 9.0, 18.0, 13.0, 26.0, 11.0, 24.0, 21.0, 27.0, 30.0, 32.0, 30.0, 30.0, 27.0, 34.0, 41.0, 25.0, 40.0, 35.0, 42.0, 43.0, 43.0, 31.0, 38.0, 35.0, 41.0, 27.0, 40.0, 24.0, 30.0, 15.0, 18.0, 8.0, 13.0, 8.0, 15.0, 5.0, 6.0, 5.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.627206802368164e-05, -1.5766359865665436e-05, -1.526065170764923e-05, -1.4754943549633026e-05, -1.4249235391616821e-05, -1.3743527233600616e-05, -1.3237819075584412e-05, -1.2732110917568207e-05, -1.2226402759552002e-05, -1.1720694601535797e-05, -1.1214986443519592e-05, -1.0709278285503387e-05, -1.0203570127487183e-05, -9.697861969470978e-06, -9.192153811454773e-06, -8.686445653438568e-06, -8.180737495422363e-06, -7.675029337406158e-06, -7.169321179389954e-06, -6.663613021373749e-06, -6.157904863357544e-06, -5.652196705341339e-06, -5.146488547325134e-06, -4.6407803893089294e-06, -4.135072231292725e-06, -3.6293640732765198e-06, -3.123655915260315e-06, -2.61794775724411e-06, -2.1122395992279053e-06, -1.6065314412117004e-06, -1.1008232831954956e-06, -5.951151251792908e-07, -8.940696716308594e-08, 4.163011908531189e-07, 9.220093488693237e-07, 1.4277175068855286e-06, 1.9334256649017334e-06, 2.4391338229179382e-06, 2.944841980934143e-06, 3.450550138950348e-06, 3.956258296966553e-06, 4.4619664549827576e-06, 4.967674612998962e-06, 5.473382771015167e-06, 5.979090929031372e-06, 6.484799087047577e-06, 6.990507245063782e-06, 7.4962154030799866e-06, 8.001923561096191e-06, 8.507631719112396e-06, 9.013339877128601e-06, 9.519048035144806e-06, 1.002475619316101e-05, 1.0530464351177216e-05, 1.103617250919342e-05, 1.1541880667209625e-05, 1.204758882522583e-05, 1.2553296983242035e-05, 1.305900514125824e-05, 1.3564713299274445e-05, 1.407042145729065e-05, 1.4576129615306854e-05, 1.5081837773323059e-05, 1.5587545931339264e-05, 1.609325408935547e-05]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 3.0, 8.0, 6.0, 11.0, 8.0, 10.0, 12.0, 23.0, 15.0, 17.0, 27.0, 19.0, 31.0, 30.0, 27.0, 49.0, 43.0, 49.0, 25.0, 52.0, 45.0, 41.0, 47.0, 47.0, 32.0, 41.0, 33.0, 28.0, 26.0, 33.0, 21.0, 28.0, 14.0, 13.0, 14.0, 17.0, 11.0, 8.0, 5.0, 7.0, 9.0, 3.0, 5.0, 6.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.27203369140625, -4.1300048828125, -3.98797607421875, -3.845947265625, -3.70391845703125, -3.5618896484375, -3.41986083984375, -3.27783203125, -3.13580322265625, -2.9937744140625, -2.85174560546875, -2.709716796875, -2.56768798828125, -2.4256591796875, -2.28363037109375, -2.1416015625, -1.99957275390625, -1.8575439453125, -1.71551513671875, -1.573486328125, -1.43145751953125, -1.2894287109375, -1.14739990234375, -1.00537109375, -0.86334228515625, -0.7213134765625, -0.57928466796875, -0.437255859375, -0.29522705078125, -0.1531982421875, -0.01116943359375, 0.130859375, 0.27288818359375, 0.4149169921875, 0.55694580078125, 0.698974609375, 0.84100341796875, 0.9830322265625, 1.12506103515625, 1.26708984375, 1.40911865234375, 1.5511474609375, 1.69317626953125, 1.835205078125, 1.97723388671875, 2.1192626953125, 2.26129150390625, 2.4033203125, 2.54534912109375, 2.6873779296875, 2.82940673828125, 2.971435546875, 3.11346435546875, 3.2554931640625, 3.39752197265625, 3.53955078125, 3.68157958984375, 3.8236083984375, 3.96563720703125, 4.107666015625, 4.24969482421875, 4.3917236328125, 4.53375244140625, 4.67578125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 3.0, 7.0, 10.0, 13.0, 14.0, 24.0, 34.0, 52.0, 51.0, 79.0, 93.0, 167.0, 289.0, 474.0, 721.0, 1232.0, 2342.0, 4140.0, 7714.0, 14577.0, 28853.0, 63879.0, 236896.0, 515423.0, 92702.0, 38262.0, 18704.0, 9642.0, 5314.0, 2788.0, 1613.0, 932.0, 515.0, 355.0, 189.0, 120.0, 78.0, 61.0, 45.0, 28.0, 21.0, 17.0, 13.0, 11.0, 11.0, 16.0, 8.0, 4.0, 7.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.0703125, -6.8436279296875, -6.616943359375, -6.3902587890625, -6.16357421875, -5.9368896484375, -5.710205078125, -5.4835205078125, -5.2568359375, -5.0301513671875, -4.803466796875, -4.5767822265625, -4.35009765625, -4.1234130859375, -3.896728515625, -3.6700439453125, -3.443359375, -3.2166748046875, -2.989990234375, -2.7633056640625, -2.53662109375, -2.3099365234375, -2.083251953125, -1.8565673828125, -1.6298828125, -1.4031982421875, -1.176513671875, -0.9498291015625, -0.72314453125, -0.4964599609375, -0.269775390625, -0.0430908203125, 0.18359375, 0.4102783203125, 0.636962890625, 0.8636474609375, 1.09033203125, 1.3170166015625, 1.543701171875, 1.7703857421875, 1.9970703125, 2.2237548828125, 2.450439453125, 2.6771240234375, 2.90380859375, 3.1304931640625, 3.357177734375, 3.5838623046875, 3.810546875, 4.0372314453125, 4.263916015625, 4.4906005859375, 4.71728515625, 4.9439697265625, 5.170654296875, 5.3973388671875, 5.6240234375, 5.8507080078125, 6.077392578125, 6.3040771484375, 6.53076171875, 6.7574462890625, 6.984130859375, 7.2108154296875, 7.4375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 7.0, 0.0, 3.0, 6.0, 7.0, 3.0, 11.0, 10.0, 11.0, 6.0, 12.0, 10.0, 12.0, 22.0, 23.0, 22.0, 31.0, 37.0, 32.0, 38.0, 25.0, 43.0, 64.0, 53.0, 88.0, 257.0, 1598.0, 116.0, 73.0, 52.0, 48.0, 37.0, 36.0, 31.0, 35.0, 27.0, 23.0, 25.0, 20.0, 15.0, 19.0, 9.0, 5.0, 10.0, 10.0, 10.0, 12.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.46875, -12.0699462890625, -11.671142578125, -11.2723388671875, -10.87353515625, -10.4747314453125, -10.075927734375, -9.6771240234375, -9.2783203125, -8.8795166015625, -8.480712890625, -8.0819091796875, -7.68310546875, -7.2843017578125, -6.885498046875, -6.4866943359375, -6.087890625, -5.6890869140625, -5.290283203125, -4.8914794921875, -4.49267578125, -4.0938720703125, -3.695068359375, -3.2962646484375, -2.8974609375, -2.4986572265625, -2.099853515625, -1.7010498046875, -1.30224609375, -0.9034423828125, -0.504638671875, -0.1058349609375, 0.29296875, 0.6917724609375, 1.090576171875, 1.4893798828125, 1.88818359375, 2.2869873046875, 2.685791015625, 3.0845947265625, 3.4833984375, 3.8822021484375, 4.281005859375, 4.6798095703125, 5.07861328125, 5.4774169921875, 5.876220703125, 6.2750244140625, 6.673828125, 7.0726318359375, 7.471435546875, 7.8702392578125, 8.26904296875, 8.6678466796875, 9.066650390625, 9.4654541015625, 9.8642578125, 10.2630615234375, 10.661865234375, 11.0606689453125, 11.45947265625, 11.8582763671875, 12.257080078125, 12.6558837890625, 13.0546875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 7.0, 6.0, 14.0, 17.0, 13.0, 17.0, 24.0, 34.0, 46.0, 75.0, 118.0, 185.0, 355.0, 672.0, 1352.0, 3065.0, 7889.0, 29713.0, 243768.0, 2752370.0, 80125.0, 16279.0, 5182.0, 2110.0, 956.0, 518.0, 291.0, 136.0, 92.0, 75.0, 51.0, 35.0, 25.0, 16.0, 15.0, 11.0, 14.0, 8.0, 7.0, 4.0, 2.0, 7.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.953125, -20.21240234375, -19.4716796875, -18.73095703125, -17.990234375, -17.24951171875, -16.5087890625, -15.76806640625, -15.02734375, -14.28662109375, -13.5458984375, -12.80517578125, -12.064453125, -11.32373046875, -10.5830078125, -9.84228515625, -9.1015625, -8.36083984375, -7.6201171875, -6.87939453125, -6.138671875, -5.39794921875, -4.6572265625, -3.91650390625, -3.17578125, -2.43505859375, -1.6943359375, -0.95361328125, -0.212890625, 0.52783203125, 1.2685546875, 2.00927734375, 2.75, 3.49072265625, 4.2314453125, 4.97216796875, 5.712890625, 6.45361328125, 7.1943359375, 7.93505859375, 8.67578125, 9.41650390625, 10.1572265625, 10.89794921875, 11.638671875, 12.37939453125, 13.1201171875, 13.86083984375, 14.6015625, 15.34228515625, 16.0830078125, 16.82373046875, 17.564453125, 18.30517578125, 19.0458984375, 19.78662109375, 20.52734375, 21.26806640625, 22.0087890625, 22.74951171875, 23.490234375, 24.23095703125, 24.9716796875, 25.71240234375, 26.453125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 46.0, 103.0, 289.0, 277.0, 186.0, 74.0, 21.0, 8.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-147.24755859375, -144.53195190429688, -141.81634521484375, -139.10073852539062, -136.3851318359375, -133.6695098876953, -130.9539031982422, -128.23829650878906, -125.52268981933594, -122.80708312988281, -120.09147644042969, -117.37586212158203, -114.6602554321289, -111.94464874267578, -109.22904205322266, -106.513427734375, -103.79782104492188, -101.08221435546875, -98.36660766601562, -95.65099334716797, -92.93538665771484, -90.21977996826172, -87.5041732788086, -84.78855895996094, -82.07295989990234, -79.35735321044922, -76.6417465209961, -73.92613220214844, -71.21052551269531, -68.49491882324219, -65.77931213378906, -63.06370162963867, -60.34809494018555, -57.63248825073242, -54.91687774658203, -52.201271057128906, -49.485660552978516, -46.77005386352539, -44.054443359375, -41.338836669921875, -38.62322998046875, -35.907623291015625, -33.192012786865234, -30.47640609741211, -27.76079559326172, -25.045188903808594, -22.329580307006836, -19.613971710205078, -16.898361206054688, -14.18275260925293, -11.467144012451172, -8.75153636932373, -6.035927772521973, -3.320319175720215, -0.6047115325927734, 2.1108970642089844, 4.826505661010742, 7.5421142578125, 10.257722854614258, 12.9733304977417, 15.688939094543457, 18.40454864501953, 21.120155334472656, 23.835763931274414, 26.551372528076172]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 8.0, 8.0, 6.0, 3.0, 11.0, 14.0, 18.0, 13.0, 22.0, 22.0, 22.0, 30.0, 29.0, 41.0, 32.0, 35.0, 40.0, 39.0, 40.0, 38.0, 40.0, 37.0, 46.0, 35.0, 40.0, 48.0, 32.0, 29.0, 24.0, 26.0, 34.0, 21.0, 21.0, 14.0, 16.0, 15.0, 9.0, 7.0, 7.0, 4.0, 7.0, 5.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0], "bins": [-42.612205505371094, -41.43217849731445, -40.25215148925781, -39.072120666503906, -37.892093658447266, -36.712066650390625, -35.532039642333984, -34.352012634277344, -33.1719856262207, -31.991958618164062, -30.81192970275879, -29.63190269470215, -28.451875686645508, -27.271846771240234, -26.091819763183594, -24.911792755126953, -23.73176383972168, -22.55173683166504, -21.371707916259766, -20.191680908203125, -19.011653900146484, -17.831626892089844, -16.65159797668457, -15.47157096862793, -14.291543006896973, -13.111515045166016, -11.931488037109375, -10.751460075378418, -9.571432113647461, -8.39140510559082, -7.211377143859863, -6.031350135803223, -4.851322174072266, -3.671294689178467, -2.491266965866089, -1.311239242553711, -0.1312117576599121, 1.0488157272338867, 2.2288436889648438, 3.4088706970214844, 4.588898658752441, 5.76892614364624, 6.948953628540039, 8.128981590270996, 9.309009552001953, 10.489036560058594, 11.66906452178955, 12.849091529846191, 14.029119491577148, 15.209147453308105, 16.389175415039062, 17.569202423095703, 18.749229431152344, 19.929256439208984, 21.109285354614258, 22.2893123626709, 23.469341278076172, 24.649368286132812, 25.829397201538086, 27.009424209594727, 28.189451217651367, 29.36948013305664, 30.54950714111328, 31.729534149169922, 32.90956115722656]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 12.0, 9.0, 14.0, 13.0, 19.0, 18.0, 19.0, 29.0, 32.0, 23.0, 33.0, 30.0, 31.0, 38.0, 39.0, 59.0, 46.0, 40.0, 42.0, 37.0, 39.0, 44.0, 29.0, 46.0, 29.0, 35.0, 29.0, 23.0, 21.0, 18.0, 11.0, 19.0, 12.0, 8.0, 10.0, 7.0, 4.0, 9.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.7833251953125, -4.633056640625, -4.4827880859375, -4.33251953125, -4.1822509765625, -4.031982421875, -3.8817138671875, -3.7314453125, -3.5811767578125, -3.430908203125, -3.2806396484375, -3.13037109375, -2.9801025390625, -2.829833984375, -2.6795654296875, -2.529296875, -2.3790283203125, -2.228759765625, -2.0784912109375, -1.92822265625, -1.7779541015625, -1.627685546875, -1.4774169921875, -1.3271484375, -1.1768798828125, -1.026611328125, -0.8763427734375, -0.72607421875, -0.5758056640625, -0.425537109375, -0.2752685546875, -0.125, 0.0252685546875, 0.175537109375, 0.3258056640625, 0.47607421875, 0.6263427734375, 0.776611328125, 0.9268798828125, 1.0771484375, 1.2274169921875, 1.377685546875, 1.5279541015625, 1.67822265625, 1.8284912109375, 1.978759765625, 2.1290283203125, 2.279296875, 2.4295654296875, 2.579833984375, 2.7301025390625, 2.88037109375, 3.0306396484375, 3.180908203125, 3.3311767578125, 3.4814453125, 3.6317138671875, 3.781982421875, 3.9322509765625, 4.08251953125, 4.2327880859375, 4.383056640625, 4.5333251953125, 4.68359375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 9.0, 18.0, 20.0, 30.0, 45.0, 59.0, 96.0, 114.0, 161.0, 282.0, 363.0, 500.0, 762.0, 1128.0, 1799.0, 2958.0, 4909.0, 8857.0, 17635.0, 37088.0, 90409.0, 274687.0, 1084192.0, 1859839.0, 540530.0, 154791.0, 58526.0, 25569.0, 12333.0, 6594.0, 3769.0, 2240.0, 1397.0, 853.0, 516.0, 388.0, 264.0, 166.0, 111.0, 79.0, 62.0, 49.0, 29.0, 20.0, 13.0, 6.0, 4.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-7.25, -7.031982421875, -6.81396484375, -6.595947265625, -6.3779296875, -6.159912109375, -5.94189453125, -5.723876953125, -5.505859375, -5.287841796875, -5.06982421875, -4.851806640625, -4.6337890625, -4.415771484375, -4.19775390625, -3.979736328125, -3.76171875, -3.543701171875, -3.32568359375, -3.107666015625, -2.8896484375, -2.671630859375, -2.45361328125, -2.235595703125, -2.017578125, -1.799560546875, -1.58154296875, -1.363525390625, -1.1455078125, -0.927490234375, -0.70947265625, -0.491455078125, -0.2734375, -0.055419921875, 0.16259765625, 0.380615234375, 0.5986328125, 0.816650390625, 1.03466796875, 1.252685546875, 1.470703125, 1.688720703125, 1.90673828125, 2.124755859375, 2.3427734375, 2.560791015625, 2.77880859375, 2.996826171875, 3.21484375, 3.432861328125, 3.65087890625, 3.868896484375, 4.0869140625, 4.304931640625, 4.52294921875, 4.740966796875, 4.958984375, 5.177001953125, 5.39501953125, 5.613037109375, 5.8310546875, 6.049072265625, 6.26708984375, 6.485107421875, 6.703125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 12.0, 9.0, 5.0, 10.0, 20.0, 25.0, 38.0, 34.0, 37.0, 62.0, 88.0, 113.0, 129.0, 211.0, 240.0, 325.0, 441.0, 504.0, 442.0, 327.0, 261.0, 171.0, 134.0, 94.0, 84.0, 58.0, 47.0, 31.0, 25.0, 19.0, 15.0, 11.0, 10.0, 5.0, 10.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.171875, -6.9364013671875, -6.700927734375, -6.4654541015625, -6.22998046875, -5.9945068359375, -5.759033203125, -5.5235595703125, -5.2880859375, -5.0526123046875, -4.817138671875, -4.5816650390625, -4.34619140625, -4.1107177734375, -3.875244140625, -3.6397705078125, -3.404296875, -3.1688232421875, -2.933349609375, -2.6978759765625, -2.46240234375, -2.2269287109375, -1.991455078125, -1.7559814453125, -1.5205078125, -1.2850341796875, -1.049560546875, -0.8140869140625, -0.57861328125, -0.3431396484375, -0.107666015625, 0.1278076171875, 0.36328125, 0.5987548828125, 0.834228515625, 1.0697021484375, 1.30517578125, 1.5406494140625, 1.776123046875, 2.0115966796875, 2.2470703125, 2.4825439453125, 2.718017578125, 2.9534912109375, 3.18896484375, 3.4244384765625, 3.659912109375, 3.8953857421875, 4.130859375, 4.3663330078125, 4.601806640625, 4.8372802734375, 5.07275390625, 5.3082275390625, 5.543701171875, 5.7791748046875, 6.0146484375, 6.2501220703125, 6.485595703125, 6.7210693359375, 6.95654296875, 7.1920166015625, 7.427490234375, 7.6629638671875, 7.8984375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 8.0, 8.0, 10.0, 15.0, 13.0, 34.0, 33.0, 49.0, 66.0, 129.0, 220.0, 428.0, 1111.0, 4110.0, 22162.0, 214741.0, 3276157.0, 619073.0, 45732.0, 7110.0, 1735.0, 579.0, 263.0, 148.0, 92.0, 66.0, 54.0, 29.0, 19.0, 24.0, 16.0, 10.0, 7.0, 5.0, 8.0, 3.0, 10.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.34375, -26.577392578125, -25.81103515625, -25.044677734375, -24.2783203125, -23.511962890625, -22.74560546875, -21.979248046875, -21.212890625, -20.446533203125, -19.68017578125, -18.913818359375, -18.1474609375, -17.381103515625, -16.61474609375, -15.848388671875, -15.08203125, -14.315673828125, -13.54931640625, -12.782958984375, -12.0166015625, -11.250244140625, -10.48388671875, -9.717529296875, -8.951171875, -8.184814453125, -7.41845703125, -6.652099609375, -5.8857421875, -5.119384765625, -4.35302734375, -3.586669921875, -2.8203125, -2.053955078125, -1.28759765625, -0.521240234375, 0.2451171875, 1.011474609375, 1.77783203125, 2.544189453125, 3.310546875, 4.076904296875, 4.84326171875, 5.609619140625, 6.3759765625, 7.142333984375, 7.90869140625, 8.675048828125, 9.44140625, 10.207763671875, 10.97412109375, 11.740478515625, 12.5068359375, 13.273193359375, 14.03955078125, 14.805908203125, 15.572265625, 16.338623046875, 17.10498046875, 17.871337890625, 18.6376953125, 19.404052734375, 20.17041015625, 20.936767578125, 21.703125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 6.0, 19.0, 30.0, 50.0, 67.0, 91.0, 124.0, 119.0, 100.0, 107.0, 84.0, 77.0, 48.0, 44.0, 10.0, 12.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.79399871826172, -58.372676849365234, -56.95135498046875, -55.530029296875, -54.108707427978516, -52.68738555908203, -51.26606369018555, -49.84474182128906, -48.42341995239258, -47.002098083496094, -45.58077621459961, -44.159454345703125, -42.738128662109375, -41.31680679321289, -39.895484924316406, -38.47416305541992, -37.05284118652344, -35.63151931762695, -34.21019744873047, -32.78887176513672, -31.367551803588867, -29.94622802734375, -28.524906158447266, -27.10358428955078, -25.68225860595703, -24.260936737060547, -22.83961296081543, -21.418291091918945, -19.99696922302246, -18.575645446777344, -17.15432357788086, -15.733001708984375, -14.311681747436523, -12.890358924865723, -11.469037055969238, -10.047714233398438, -8.626392364501953, -7.205069541931152, -5.783746719360352, -4.362424850463867, -2.9411020278930664, -1.5197795629501343, -0.09845709800720215, 1.3228654861450195, 2.744187831878662, 4.165510177612305, 5.5868330001831055, 7.00815486907959, 8.42947769165039, 9.850800514221191, 11.272122383117676, 12.693445205688477, 14.114767074584961, 15.536089897155762, 16.957412719726562, 18.378734588623047, 19.80005645751953, 21.221378326416016, 22.642702102661133, 24.064023971557617, 25.4853458404541, 26.90666961669922, 28.327991485595703, 29.749313354492188, 31.170637130737305]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 7.0, 10.0, 7.0, 7.0, 11.0, 12.0, 17.0, 19.0, 16.0, 23.0, 25.0, 18.0, 21.0, 24.0, 29.0, 34.0, 46.0, 37.0, 41.0, 32.0, 43.0, 46.0, 42.0, 37.0, 43.0, 40.0, 57.0, 33.0, 37.0, 26.0, 19.0, 25.0, 18.0, 21.0, 16.0, 10.0, 15.0, 6.0, 7.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-31.317338943481445, -30.392759323120117, -29.468177795410156, -28.543598175048828, -27.6190185546875, -26.69443702697754, -25.76985740661621, -24.84527587890625, -23.920696258544922, -22.996116638183594, -22.071535110473633, -21.146955490112305, -20.222373962402344, -19.297794342041016, -18.373214721679688, -17.44863510131836, -16.5240535736084, -15.599472999572754, -14.67489242553711, -13.750312805175781, -12.825732231140137, -11.901151657104492, -10.976572036743164, -10.05199146270752, -9.127410888671875, -8.20283031463623, -7.278250217437744, -6.353670120239258, -5.429089546203613, -4.504508972167969, -3.5799288749694824, -2.655348777770996, -1.7307662963867188, -0.8061859607696533, 0.11839437484741211, 1.0429747104644775, 1.967555046081543, 2.8921356201171875, 3.816715717315674, 4.74129581451416, 5.665876388549805, 6.590456962585449, 7.5150370597839355, 8.439617156982422, 9.364197731018066, 10.288778305053711, 11.213357925415039, 12.137938499450684, 13.062519073486328, 13.987099647521973, 14.911680221557617, 15.836259841918945, 16.760841369628906, 17.685420989990234, 18.610000610351562, 19.53458023071289, 20.45916175842285, 21.38374137878418, 22.30832290649414, 23.23290252685547, 24.157482147216797, 25.082063674926758, 26.006643295288086, 26.931224822998047, 27.855804443359375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [6.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 4.0, 16.0, 8.0, 8.0, 19.0, 18.0, 11.0, 18.0, 15.0, 21.0, 25.0, 32.0, 23.0, 24.0, 33.0, 34.0, 42.0, 40.0, 33.0, 39.0, 44.0, 33.0, 33.0, 49.0, 39.0, 33.0, 36.0, 35.0, 20.0, 25.0, 25.0, 15.0, 21.0, 18.0, 20.0, 9.0, 12.0, 5.0, 13.0, 9.0, 6.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.109375, -3.970947265625, -3.83251953125, -3.694091796875, -3.5556640625, -3.417236328125, -3.27880859375, -3.140380859375, -3.001953125, -2.863525390625, -2.72509765625, -2.586669921875, -2.4482421875, -2.309814453125, -2.17138671875, -2.032958984375, -1.89453125, -1.756103515625, -1.61767578125, -1.479248046875, -1.3408203125, -1.202392578125, -1.06396484375, -0.925537109375, -0.787109375, -0.648681640625, -0.51025390625, -0.371826171875, -0.2333984375, -0.094970703125, 0.04345703125, 0.181884765625, 0.3203125, 0.458740234375, 0.59716796875, 0.735595703125, 0.8740234375, 1.012451171875, 1.15087890625, 1.289306640625, 1.427734375, 1.566162109375, 1.70458984375, 1.843017578125, 1.9814453125, 2.119873046875, 2.25830078125, 2.396728515625, 2.53515625, 2.673583984375, 2.81201171875, 2.950439453125, 3.0888671875, 3.227294921875, 3.36572265625, 3.504150390625, 3.642578125, 3.781005859375, 3.91943359375, 4.057861328125, 4.1962890625, 4.334716796875, 4.47314453125, 4.611572265625, 4.75]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 2.0, 2.0, 7.0, 11.0, 11.0, 21.0, 41.0, 42.0, 71.0, 115.0, 133.0, 212.0, 337.0, 472.0, 683.0, 1086.0, 1409.0, 2249.0, 3231.0, 4955.0, 7473.0, 11739.0, 18262.0, 30267.0, 52324.0, 97169.0, 218145.0, 319723.0, 120311.0, 62258.0, 35356.0, 21572.0, 13409.0, 8495.0, 5531.0, 3743.0, 2462.0, 1600.0, 1115.0, 784.0, 540.0, 368.0, 241.0, 209.0, 117.0, 77.0, 65.0, 47.0, 25.0, 12.0, 9.0, 12.0, 3.0, 0.0, 2.0, 1.0, 5.0], "bins": [-0.43994140625, -0.4270591735839844, -0.41417694091796875, -0.4012947082519531, -0.3884124755859375, -0.3755302429199219, -0.36264801025390625, -0.3497657775878906, -0.336883544921875, -0.3240013122558594, -0.31111907958984375, -0.2982368469238281, -0.2853546142578125, -0.2724723815917969, -0.25959014892578125, -0.24670791625976562, -0.23382568359375, -0.22094345092773438, -0.20806121826171875, -0.19517898559570312, -0.1822967529296875, -0.16941452026367188, -0.15653228759765625, -0.14365005493164062, -0.130767822265625, -0.11788558959960938, -0.10500335693359375, -0.09212112426757812, -0.0792388916015625, -0.06635665893554688, -0.05347442626953125, -0.040592193603515625, -0.0277099609375, -0.014827728271484375, -0.00194549560546875, 0.010936737060546875, 0.0238189697265625, 0.036701202392578125, 0.04958343505859375, 0.062465667724609375, 0.075347900390625, 0.08823013305664062, 0.10111236572265625, 0.11399459838867188, 0.1268768310546875, 0.13975906372070312, 0.15264129638671875, 0.16552352905273438, 0.17840576171875, 0.19128799438476562, 0.20417022705078125, 0.21705245971679688, 0.2299346923828125, 0.24281692504882812, 0.25569915771484375, 0.2685813903808594, 0.281463623046875, 0.2943458557128906, 0.30722808837890625, 0.3201103210449219, 0.3329925537109375, 0.3458747863769531, 0.35875701904296875, 0.3716392517089844, 0.384521484375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 10.0, 10.0, 4.0, 5.0, 13.0, 14.0, 19.0, 21.0, 25.0, 23.0, 20.0, 19.0, 29.0, 30.0, 20.0, 25.0, 31.0, 33.0, 30.0, 42.0, 46.0, 1074.0, 38.0, 37.0, 43.0, 31.0, 35.0, 36.0, 27.0, 24.0, 21.0, 17.0, 27.0, 23.0, 19.0, 18.0, 18.0, 16.0, 8.0, 9.0, 8.0, 8.0, 3.0, 5.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.439453125, -3.33575439453125, -3.2320556640625, -3.12835693359375, -3.024658203125, -2.92095947265625, -2.8172607421875, -2.71356201171875, -2.60986328125, -2.50616455078125, -2.4024658203125, -2.29876708984375, -2.195068359375, -2.09136962890625, -1.9876708984375, -1.88397216796875, -1.7802734375, -1.67657470703125, -1.5728759765625, -1.46917724609375, -1.365478515625, -1.26177978515625, -1.1580810546875, -1.05438232421875, -0.95068359375, -0.84698486328125, -0.7432861328125, -0.63958740234375, -0.535888671875, -0.43218994140625, -0.3284912109375, -0.22479248046875, -0.12109375, -0.01739501953125, 0.0863037109375, 0.19000244140625, 0.293701171875, 0.39739990234375, 0.5010986328125, 0.60479736328125, 0.70849609375, 0.81219482421875, 0.9158935546875, 1.01959228515625, 1.123291015625, 1.22698974609375, 1.3306884765625, 1.43438720703125, 1.5380859375, 1.64178466796875, 1.7454833984375, 1.84918212890625, 1.952880859375, 2.05657958984375, 2.1602783203125, 2.26397705078125, 2.36767578125, 2.47137451171875, 2.5750732421875, 2.67877197265625, 2.782470703125, 2.88616943359375, 2.9898681640625, 3.09356689453125, 3.197265625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 11.0, 10.0, 16.0, 33.0, 42.0, 42.0, 58.0, 138.0, 175.0, 234.0, 338.0, 528.0, 766.0, 1064.0, 1705.0, 2411.0, 3605.0, 5629.0, 8473.0, 12721.0, 20260.0, 32168.0, 54009.0, 97113.0, 251444.0, 1348436.0, 104252.0, 56727.0, 33789.0, 21268.0, 13528.0, 8777.0, 5751.0, 3771.0, 2551.0, 1669.0, 1142.0, 802.0, 520.0, 376.0, 228.0, 171.0, 128.0, 63.0, 67.0, 43.0, 34.0, 15.0, 9.0, 5.0, 8.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.215576171875, -0.2086334228515625, -0.201690673828125, -0.1947479248046875, -0.18780517578125, -0.1808624267578125, -0.173919677734375, -0.1669769287109375, -0.1600341796875, -0.1530914306640625, -0.146148681640625, -0.1392059326171875, -0.13226318359375, -0.1253204345703125, -0.118377685546875, -0.1114349365234375, -0.1044921875, -0.0975494384765625, -0.090606689453125, -0.0836639404296875, -0.07672119140625, -0.0697784423828125, -0.062835693359375, -0.0558929443359375, -0.0489501953125, -0.0420074462890625, -0.035064697265625, -0.0281219482421875, -0.02117919921875, -0.0142364501953125, -0.007293701171875, -0.0003509521484375, 0.006591796875, 0.0135345458984375, 0.020477294921875, 0.0274200439453125, 0.03436279296875, 0.0413055419921875, 0.048248291015625, 0.0551910400390625, 0.0621337890625, 0.0690765380859375, 0.076019287109375, 0.0829620361328125, 0.08990478515625, 0.0968475341796875, 0.103790283203125, 0.1107330322265625, 0.11767578125, 0.1246185302734375, 0.131561279296875, 0.1385040283203125, 0.14544677734375, 0.1523895263671875, 0.159332275390625, 0.1662750244140625, 0.1732177734375, 0.1801605224609375, 0.187103271484375, 0.1940460205078125, 0.20098876953125, 0.2079315185546875, 0.214874267578125, 0.2218170166015625, 0.228759765625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 13.0, 17.0, 25.0, 29.0, 29.0, 45.0, 61.0, 81.0, 94.0, 169.0, 96.0, 83.0, 59.0, 47.0, 46.0, 32.0, 19.0, 17.0, 8.0, 13.0, 0.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.45246696472168e-05, -4.290509968996048e-05, -4.128552973270416e-05, -3.9665959775447845e-05, -3.804638981819153e-05, -3.642681986093521e-05, -3.4807249903678894e-05, -3.318767994642258e-05, -3.156810998916626e-05, -2.9948540031909943e-05, -2.8328970074653625e-05, -2.670940011739731e-05, -2.508983016014099e-05, -2.3470260202884674e-05, -2.1850690245628357e-05, -2.023112028837204e-05, -1.8611550331115723e-05, -1.6991980373859406e-05, -1.537241041660309e-05, -1.3752840459346771e-05, -1.2133270502090454e-05, -1.0513700544834137e-05, -8.89413058757782e-06, -7.274560630321503e-06, -5.6549906730651855e-06, -4.035420715808868e-06, -2.4158507585525513e-06, -7.962808012962341e-07, 8.23289155960083e-07, 2.4428591132164e-06, 4.062429070472717e-06, 5.6819990277290344e-06, 7.3015689849853516e-06, 8.921138942241669e-06, 1.0540708899497986e-05, 1.2160278856754303e-05, 1.377984881401062e-05, 1.5399418771266937e-05, 1.7018988728523254e-05, 1.863855868577957e-05, 2.025812864303589e-05, 2.1877698600292206e-05, 2.3497268557548523e-05, 2.511683851480484e-05, 2.6736408472061157e-05, 2.8355978429317474e-05, 2.997554838657379e-05, 3.159511834383011e-05, 3.3214688301086426e-05, 3.483425825834274e-05, 3.645382821559906e-05, 3.807339817285538e-05, 3.9692968130111694e-05, 4.131253808736801e-05, 4.293210804462433e-05, 4.4551678001880646e-05, 4.617124795913696e-05, 4.779081791639328e-05, 4.94103878736496e-05, 5.1029957830905914e-05, 5.264952778816223e-05, 5.426909774541855e-05, 5.5888667702674866e-05, 5.750823765993118e-05, 5.91278076171875e-05]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 8.0, 12.0, 9.0, 29.0, 35.0, 49.0, 66.0, 117.0, 242.0, 2682.0, 1038790.0, 5894.0, 297.0, 107.0, 70.0, 39.0, 30.0, 28.0, 17.0, 15.0, 4.0, 4.0, 9.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014944076538085938, -0.0014535337686538696, -0.0014126598834991455, -0.0013717859983444214, -0.0013309121131896973, -0.0012900382280349731, -0.001249164342880249, -0.001208290457725525, -0.0011674165725708008, -0.0011265426874160767, -0.0010856688022613525, -0.0010447949171066284, -0.0010039210319519043, -0.0009630471467971802, -0.0009221732616424561, -0.0008812993764877319, -0.0008404254913330078, -0.0007995516061782837, -0.0007586777210235596, -0.0007178038358688354, -0.0006769299507141113, -0.0006360560655593872, -0.0005951821804046631, -0.000554308295249939, -0.0005134344100952148, -0.0004725605249404907, -0.0004316866397857666, -0.0003908127546310425, -0.00034993886947631836, -0.00030906498432159424, -0.0002681910991668701, -0.000227317214012146, -0.00018644332885742188, -0.00014556944370269775, -0.00010469555854797363, -6.382167339324951e-05, -2.294778823852539e-05, 1.792609691619873e-05, 5.879998207092285e-05, 9.967386722564697e-05, 0.0001405477523803711, 0.00018142163753509521, 0.00022229552268981934, 0.00026316940784454346, 0.0003040432929992676, 0.0003449171781539917, 0.0003857910633087158, 0.00042666494846343994, 0.00046753883361816406, 0.0005084127187728882, 0.0005492866039276123, 0.0005901604890823364, 0.0006310343742370605, 0.0006719082593917847, 0.0007127821445465088, 0.0007536560297012329, 0.000794529914855957, 0.0008354038000106812, 0.0008762776851654053, 0.0009171515703201294, 0.0009580254554748535, 0.0009988993406295776, 0.0010397732257843018, 0.0010806471109390259, 0.00112152099609375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 16.0, 30.0, 60.0, 133.0, 229.0, 222.0, 161.0, 74.0, 28.0, 16.0, 16.0, 10.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53208849648945e-05, -4.39509931311477e-05, -4.258110129740089e-05, -4.1211209463654086e-05, -3.984131762990728e-05, -3.8471425796160474e-05, -3.710153396241367e-05, -3.573164212866686e-05, -3.436175029492006e-05, -3.299185846117325e-05, -3.1621966627426445e-05, -3.025207479367964e-05, -2.8882182959932834e-05, -2.7512291126186028e-05, -2.6142399292439222e-05, -2.4772507458692417e-05, -2.340261562494561e-05, -2.2032723791198805e-05, -2.0662831957452e-05, -1.9292940123705193e-05, -1.7923048289958388e-05, -1.6553156456211582e-05, -1.5183264622464776e-05, -1.381337278871797e-05, -1.2443480954971164e-05, -1.1073589121224359e-05, -9.703697287477553e-06, -8.333805453730747e-06, -6.963913619983941e-06, -5.5940217862371355e-06, -4.22412995249033e-06, -2.854238118743524e-06, -1.484342647017911e-06, -1.1445081327110529e-07, 1.2554410204757005e-06, 2.6253328542225063e-06, 3.995224687969312e-06, 5.365116521716118e-06, 6.735008355462924e-06, 8.10490018920973e-06, 9.474792022956535e-06, 1.0844683856703341e-05, 1.2214575690450147e-05, 1.3584467524196953e-05, 1.4954359357943758e-05, 1.6324251191690564e-05, 1.769414302543737e-05, 1.9064034859184176e-05, 2.043392669293098e-05, 2.1803818526677787e-05, 2.3173710360424593e-05, 2.45436021941714e-05, 2.5913494027918205e-05, 2.728338586166501e-05, 2.8653277695411816e-05, 3.0023169529158622e-05, 3.139306136290543e-05, 3.2762953196652234e-05, 3.413284503039904e-05, 3.5502736864145845e-05, 3.687262869789265e-05, 3.824252053163946e-05, 3.961241236538626e-05, 4.098230419913307e-05, 4.2352196032879874e-05]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 10.0, 9.0, 5.0, 12.0, 8.0, 12.0, 9.0, 9.0, 14.0, 26.0, 20.0, 29.0, 30.0, 37.0, 29.0, 37.0, 41.0, 37.0, 38.0, 41.0, 49.0, 39.0, 37.0, 35.0, 39.0, 30.0, 52.0, 33.0, 27.0, 31.0, 32.0, 21.0, 31.0, 11.0, 10.0, 9.0, 9.0, 9.0, 7.0, 7.0, 10.0, 7.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.436471939086914e-05, -1.385621726512909e-05, -1.3347715139389038e-05, -1.2839213013648987e-05, -1.2330710887908936e-05, -1.1822208762168884e-05, -1.1313706636428833e-05, -1.0805204510688782e-05, -1.029670238494873e-05, -9.78820025920868e-06, -9.279698133468628e-06, -8.771196007728577e-06, -8.262693881988525e-06, -7.754191756248474e-06, -7.245689630508423e-06, -6.737187504768372e-06, -6.22868537902832e-06, -5.720183253288269e-06, -5.211681127548218e-06, -4.7031790018081665e-06, -4.194676876068115e-06, -3.686174750328064e-06, -3.1776726245880127e-06, -2.6691704988479614e-06, -2.16066837310791e-06, -1.6521662473678589e-06, -1.1436641216278076e-06, -6.351619958877563e-07, -1.2665987014770508e-07, 3.818422555923462e-07, 8.903443813323975e-07, 1.3988465070724487e-06, 1.9073486328125e-06, 2.4158507585525513e-06, 2.9243528842926025e-06, 3.432855010032654e-06, 3.941357135772705e-06, 4.449859261512756e-06, 4.958361387252808e-06, 5.466863512992859e-06, 5.97536563873291e-06, 6.4838677644729614e-06, 6.992369890213013e-06, 7.500872015953064e-06, 8.009374141693115e-06, 8.517876267433167e-06, 9.026378393173218e-06, 9.534880518913269e-06, 1.004338264465332e-05, 1.0551884770393372e-05, 1.1060386896133423e-05, 1.1568889021873474e-05, 1.2077391147613525e-05, 1.2585893273353577e-05, 1.3094395399093628e-05, 1.360289752483368e-05, 1.411139965057373e-05, 1.4619901776313782e-05, 1.5128403902053833e-05, 1.5636906027793884e-05, 1.6145408153533936e-05, 1.6653910279273987e-05, 1.7162412405014038e-05, 1.767091453075409e-05, 1.817941665649414e-05]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [6.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 4.0, 16.0, 8.0, 8.0, 19.0, 18.0, 11.0, 18.0, 15.0, 21.0, 25.0, 32.0, 23.0, 24.0, 33.0, 34.0, 42.0, 40.0, 33.0, 39.0, 44.0, 33.0, 33.0, 49.0, 39.0, 33.0, 36.0, 35.0, 20.0, 25.0, 25.0, 15.0, 21.0, 18.0, 20.0, 9.0, 12.0, 5.0, 13.0, 9.0, 6.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.109375, -3.970947265625, -3.83251953125, -3.694091796875, -3.5556640625, -3.417236328125, -3.27880859375, -3.140380859375, -3.001953125, -2.863525390625, -2.72509765625, -2.586669921875, -2.4482421875, -2.309814453125, -2.17138671875, -2.032958984375, -1.89453125, -1.756103515625, -1.61767578125, -1.479248046875, -1.3408203125, -1.202392578125, -1.06396484375, -0.925537109375, -0.787109375, -0.648681640625, -0.51025390625, -0.371826171875, -0.2333984375, -0.094970703125, 0.04345703125, 0.181884765625, 0.3203125, 0.458740234375, 0.59716796875, 0.735595703125, 0.8740234375, 1.012451171875, 1.15087890625, 1.289306640625, 1.427734375, 1.566162109375, 1.70458984375, 1.843017578125, 1.9814453125, 2.119873046875, 2.25830078125, 2.396728515625, 2.53515625, 2.673583984375, 2.81201171875, 2.950439453125, 3.0888671875, 3.227294921875, 3.36572265625, 3.504150390625, 3.642578125, 3.781005859375, 3.91943359375, 4.057861328125, 4.1962890625, 4.334716796875, 4.47314453125, 4.611572265625, 4.75]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 8.0, 7.0, 6.0, 10.0, 21.0, 24.0, 40.0, 51.0, 87.0, 131.0, 179.0, 246.0, 361.0, 507.0, 777.0, 1178.0, 1679.0, 2386.0, 3486.0, 5248.0, 7927.0, 11599.0, 17114.0, 26059.0, 41493.0, 71491.0, 156500.0, 314054.0, 178084.0, 79011.0, 44585.0, 27897.0, 18476.0, 12127.0, 8124.0, 5636.0, 3857.0, 2544.0, 1790.0, 1232.0, 798.0, 526.0, 365.0, 275.0, 184.0, 134.0, 79.0, 60.0, 36.0, 26.0, 15.0, 10.0, 14.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.05859375, -4.89837646484375, -4.7381591796875, -4.57794189453125, -4.417724609375, -4.25750732421875, -4.0972900390625, -3.93707275390625, -3.77685546875, -3.61663818359375, -3.4564208984375, -3.29620361328125, -3.135986328125, -2.97576904296875, -2.8155517578125, -2.65533447265625, -2.4951171875, -2.33489990234375, -2.1746826171875, -2.01446533203125, -1.854248046875, -1.69403076171875, -1.5338134765625, -1.37359619140625, -1.21337890625, -1.05316162109375, -0.8929443359375, -0.73272705078125, -0.572509765625, -0.41229248046875, -0.2520751953125, -0.09185791015625, 0.068359375, 0.22857666015625, 0.3887939453125, 0.54901123046875, 0.709228515625, 0.86944580078125, 1.0296630859375, 1.18988037109375, 1.35009765625, 1.51031494140625, 1.6705322265625, 1.83074951171875, 1.990966796875, 2.15118408203125, 2.3114013671875, 2.47161865234375, 2.6318359375, 2.79205322265625, 2.9522705078125, 3.11248779296875, 3.272705078125, 3.43292236328125, 3.5931396484375, 3.75335693359375, 3.91357421875, 4.07379150390625, 4.2340087890625, 4.39422607421875, 4.554443359375, 4.71466064453125, 4.8748779296875, 5.03509521484375, 5.1953125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 9.0, 5.0, 8.0, 11.0, 14.0, 23.0, 12.0, 27.0, 28.0, 16.0, 26.0, 49.0, 43.0, 43.0, 57.0, 80.0, 115.0, 182.0, 1352.0, 278.0, 168.0, 95.0, 62.0, 57.0, 39.0, 29.0, 33.0, 27.0, 22.0, 22.0, 21.0, 14.0, 16.0, 6.0, 6.0, 12.0, 9.0, 6.0, 5.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.6171875, -14.158203125, -13.69921875, -13.240234375, -12.78125, -12.322265625, -11.86328125, -11.404296875, -10.9453125, -10.486328125, -10.02734375, -9.568359375, -9.109375, -8.650390625, -8.19140625, -7.732421875, -7.2734375, -6.814453125, -6.35546875, -5.896484375, -5.4375, -4.978515625, -4.51953125, -4.060546875, -3.6015625, -3.142578125, -2.68359375, -2.224609375, -1.765625, -1.306640625, -0.84765625, -0.388671875, 0.0703125, 0.529296875, 0.98828125, 1.447265625, 1.90625, 2.365234375, 2.82421875, 3.283203125, 3.7421875, 4.201171875, 4.66015625, 5.119140625, 5.578125, 6.037109375, 6.49609375, 6.955078125, 7.4140625, 7.873046875, 8.33203125, 8.791015625, 9.25, 9.708984375, 10.16796875, 10.626953125, 11.0859375, 11.544921875, 12.00390625, 12.462890625, 12.921875, 13.380859375, 13.83984375, 14.298828125, 14.7578125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 5.0, 5.0, 4.0, 6.0, 12.0, 13.0, 13.0, 18.0, 24.0, 39.0, 63.0, 75.0, 140.0, 235.0, 495.0, 1426.0, 5639.0, 26942.0, 191067.0, 2406303.0, 452525.0, 47833.0, 9187.0, 2221.0, 681.0, 261.0, 152.0, 98.0, 65.0, 52.0, 32.0, 22.0, 20.0, 13.0, 9.0, 5.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.578125, -20.016845703125, -19.45556640625, -18.894287109375, -18.3330078125, -17.771728515625, -17.21044921875, -16.649169921875, -16.087890625, -15.526611328125, -14.96533203125, -14.404052734375, -13.8427734375, -13.281494140625, -12.72021484375, -12.158935546875, -11.59765625, -11.036376953125, -10.47509765625, -9.913818359375, -9.3525390625, -8.791259765625, -8.22998046875, -7.668701171875, -7.107421875, -6.546142578125, -5.98486328125, -5.423583984375, -4.8623046875, -4.301025390625, -3.73974609375, -3.178466796875, -2.6171875, -2.055908203125, -1.49462890625, -0.933349609375, -0.3720703125, 0.189208984375, 0.75048828125, 1.311767578125, 1.873046875, 2.434326171875, 2.99560546875, 3.556884765625, 4.1181640625, 4.679443359375, 5.24072265625, 5.802001953125, 6.36328125, 6.924560546875, 7.48583984375, 8.047119140625, 8.6083984375, 9.169677734375, 9.73095703125, 10.292236328125, 10.853515625, 11.414794921875, 11.97607421875, 12.537353515625, 13.0986328125, 13.659912109375, 14.22119140625, 14.782470703125, 15.34375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 428.0, 575.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-521.4027099609375, -511.1947021484375, -500.9867248535156, -490.77874755859375, -480.57073974609375, -470.36273193359375, -460.1547546386719, -449.94677734375, -439.73876953125, -429.53076171875, -419.3227844238281, -409.11480712890625, -398.90679931640625, -388.69879150390625, -378.4908142089844, -368.2828369140625, -358.0748291015625, -347.8668212890625, -337.6588439941406, -327.45086669921875, -317.24285888671875, -307.03485107421875, -296.8268737792969, -286.618896484375, -276.410888671875, -266.202880859375, -255.99490356445312, -245.7869110107422, -235.57891845703125, -225.3709259033203, -215.16293334960938, -204.95494079589844, -194.74697875976562, -184.5389862060547, -174.33099365234375, -164.1230010986328, -153.91500854492188, -143.70701599121094, -133.4990234375, -123.29103088378906, -113.08303833007812, -102.87504577636719, -92.66705322265625, -82.45906066894531, -72.25106811523438, -62.04307556152344, -51.8350830078125, -41.62709045410156, -31.419097900390625, -21.211105346679688, -11.00311279296875, -0.7951202392578125, 9.412872314453125, 19.620864868164062, 29.828857421875, 40.03684997558594, 50.244842529296875, 60.45283508300781, 70.66082763671875, 80.86882019042969, 91.07681274414062, 101.28480529785156, 111.4927978515625, 121.70079040527344, 131.90878295898438]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 4.0, 0.0, 7.0, 8.0, 4.0, 11.0, 15.0, 14.0, 18.0, 19.0, 17.0, 18.0, 24.0, 31.0, 30.0, 25.0, 41.0, 36.0, 33.0, 33.0, 37.0, 40.0, 41.0, 31.0, 39.0, 37.0, 39.0, 29.0, 41.0, 25.0, 24.0, 22.0, 19.0, 20.0, 16.0, 20.0, 18.0, 18.0, 12.0, 20.0, 7.0, 8.0, 10.0, 7.0, 5.0, 4.0, 6.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.811782836914062, -27.820764541625977, -26.82974624633789, -25.838729858398438, -24.84771156311035, -23.856693267822266, -22.86567497253418, -21.874656677246094, -20.88364028930664, -19.892621994018555, -18.90160369873047, -17.910587310791016, -16.91956901550293, -15.928550720214844, -14.937532424926758, -13.946514129638672, -12.955495834350586, -11.9644775390625, -10.97346019744873, -9.982441902160645, -8.991424560546875, -8.000406265258789, -7.009387969970703, -6.018370151519775, -5.027352333068848, -4.03633451461792, -3.045316457748413, -2.0542984008789062, -1.0632805824279785, -0.07226276397705078, 0.9187555313110352, 1.909773349761963, 2.9007911682128906, 3.8918089866638184, 4.882826805114746, 5.873845100402832, 6.86486291885376, 7.8558807373046875, 8.846899032592773, 9.83791732788086, 10.828934669494629, 11.819952964782715, 12.810970306396484, 13.80198860168457, 14.793006896972656, 15.784024238586426, 16.775043487548828, 17.76605987548828, 18.757078170776367, 19.748096466064453, 20.73911476135254, 21.730133056640625, 22.721149444580078, 23.712167739868164, 24.70318603515625, 25.694204330444336, 26.685222625732422, 27.676240921020508, 28.667259216308594, 29.658275604248047, 30.649293899536133, 31.64031219482422, 32.63133239746094, 33.62234878540039, 34.613365173339844]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 3.0, 8.0, 5.0, 1.0, 10.0, 14.0, 7.0, 15.0, 18.0, 21.0, 23.0, 22.0, 14.0, 34.0, 29.0, 31.0, 24.0, 34.0, 32.0, 28.0, 29.0, 31.0, 46.0, 34.0, 52.0, 50.0, 47.0, 36.0, 28.0, 36.0, 32.0, 22.0, 22.0, 22.0, 18.0, 16.0, 17.0, 14.0, 12.0, 9.0, 10.0, 7.0, 6.0, 6.0, 7.0, 7.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.51953125, -4.37347412109375, -4.2274169921875, -4.08135986328125, -3.935302734375, -3.78924560546875, -3.6431884765625, -3.49713134765625, -3.35107421875, -3.20501708984375, -3.0589599609375, -2.91290283203125, -2.766845703125, -2.62078857421875, -2.4747314453125, -2.32867431640625, -2.1826171875, -2.03656005859375, -1.8905029296875, -1.74444580078125, -1.598388671875, -1.45233154296875, -1.3062744140625, -1.16021728515625, -1.01416015625, -0.86810302734375, -0.7220458984375, -0.57598876953125, -0.429931640625, -0.28387451171875, -0.1378173828125, 0.00823974609375, 0.154296875, 0.30035400390625, 0.4464111328125, 0.59246826171875, 0.738525390625, 0.88458251953125, 1.0306396484375, 1.17669677734375, 1.32275390625, 1.46881103515625, 1.6148681640625, 1.76092529296875, 1.906982421875, 2.05303955078125, 2.1990966796875, 2.34515380859375, 2.4912109375, 2.63726806640625, 2.7833251953125, 2.92938232421875, 3.075439453125, 3.22149658203125, 3.3675537109375, 3.51361083984375, 3.65966796875, 3.80572509765625, 3.9517822265625, 4.09783935546875, 4.243896484375, 4.38995361328125, 4.5360107421875, 4.68206787109375, 4.828125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 5.0, 5.0, 17.0, 20.0, 17.0, 22.0, 31.0, 43.0, 58.0, 71.0, 143.0, 238.0, 429.0, 835.0, 1574.0, 3463.0, 7499.0, 18503.0, 51170.0, 175510.0, 1035034.0, 2350479.0, 402694.0, 94450.0, 30591.0, 11590.0, 5051.0, 2185.0, 1090.0, 558.0, 302.0, 198.0, 126.0, 73.0, 55.0, 39.0, 27.0, 18.0, 20.0, 10.0, 7.0, 8.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-12.71875, -12.3580322265625, -11.997314453125, -11.6365966796875, -11.27587890625, -10.9151611328125, -10.554443359375, -10.1937255859375, -9.8330078125, -9.4722900390625, -9.111572265625, -8.7508544921875, -8.39013671875, -8.0294189453125, -7.668701171875, -7.3079833984375, -6.947265625, -6.5865478515625, -6.225830078125, -5.8651123046875, -5.50439453125, -5.1436767578125, -4.782958984375, -4.4222412109375, -4.0615234375, -3.7008056640625, -3.340087890625, -2.9793701171875, -2.61865234375, -2.2579345703125, -1.897216796875, -1.5364990234375, -1.17578125, -0.8150634765625, -0.454345703125, -0.0936279296875, 0.26708984375, 0.6278076171875, 0.988525390625, 1.3492431640625, 1.7099609375, 2.0706787109375, 2.431396484375, 2.7921142578125, 3.15283203125, 3.5135498046875, 3.874267578125, 4.2349853515625, 4.595703125, 4.9564208984375, 5.317138671875, 5.6778564453125, 6.03857421875, 6.3992919921875, 6.760009765625, 7.1207275390625, 7.4814453125, 7.8421630859375, 8.202880859375, 8.5635986328125, 8.92431640625, 9.2850341796875, 9.645751953125, 10.0064697265625, 10.3671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 7.0, 7.0, 8.0, 8.0, 12.0, 25.0, 20.0, 43.0, 60.0, 80.0, 109.0, 185.0, 206.0, 315.0, 460.0, 623.0, 612.0, 396.0, 262.0, 187.0, 135.0, 75.0, 70.0, 49.0, 31.0, 31.0, 21.0, 16.0, 2.0, 8.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.7421875, -11.41357421875, -11.0849609375, -10.75634765625, -10.427734375, -10.09912109375, -9.7705078125, -9.44189453125, -9.11328125, -8.78466796875, -8.4560546875, -8.12744140625, -7.798828125, -7.47021484375, -7.1416015625, -6.81298828125, -6.484375, -6.15576171875, -5.8271484375, -5.49853515625, -5.169921875, -4.84130859375, -4.5126953125, -4.18408203125, -3.85546875, -3.52685546875, -3.1982421875, -2.86962890625, -2.541015625, -2.21240234375, -1.8837890625, -1.55517578125, -1.2265625, -0.89794921875, -0.5693359375, -0.24072265625, 0.087890625, 0.41650390625, 0.7451171875, 1.07373046875, 1.40234375, 1.73095703125, 2.0595703125, 2.38818359375, 2.716796875, 3.04541015625, 3.3740234375, 3.70263671875, 4.03125, 4.35986328125, 4.6884765625, 5.01708984375, 5.345703125, 5.67431640625, 6.0029296875, 6.33154296875, 6.66015625, 6.98876953125, 7.3173828125, 7.64599609375, 7.974609375, 8.30322265625, 8.6318359375, 8.96044921875, 9.2890625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 13.0, 10.0, 26.0, 34.0, 57.0, 93.0, 192.0, 374.0, 663.0, 1318.0, 2797.0, 6796.0, 17014.0, 50569.0, 174124.0, 819274.0, 2434485.0, 505885.0, 120699.0, 36941.0, 13141.0, 5341.0, 2209.0, 1012.0, 544.0, 287.0, 147.0, 93.0, 49.0, 30.0, 19.0, 10.0, 14.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.453125, -14.0198974609375, -13.586669921875, -13.1534423828125, -12.72021484375, -12.2869873046875, -11.853759765625, -11.4205322265625, -10.9873046875, -10.5540771484375, -10.120849609375, -9.6876220703125, -9.25439453125, -8.8211669921875, -8.387939453125, -7.9547119140625, -7.521484375, -7.0882568359375, -6.655029296875, -6.2218017578125, -5.78857421875, -5.3553466796875, -4.922119140625, -4.4888916015625, -4.0556640625, -3.6224365234375, -3.189208984375, -2.7559814453125, -2.32275390625, -1.8895263671875, -1.456298828125, -1.0230712890625, -0.58984375, -0.1566162109375, 0.276611328125, 0.7098388671875, 1.14306640625, 1.5762939453125, 2.009521484375, 2.4427490234375, 2.8759765625, 3.3092041015625, 3.742431640625, 4.1756591796875, 4.60888671875, 5.0421142578125, 5.475341796875, 5.9085693359375, 6.341796875, 6.7750244140625, 7.208251953125, 7.6414794921875, 8.07470703125, 8.5079345703125, 8.941162109375, 9.3743896484375, 9.8076171875, 10.2408447265625, 10.674072265625, 11.1072998046875, 11.54052734375, 11.9737548828125, 12.406982421875, 12.8402099609375, 13.2734375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 18.0, 69.0, 167.0, 303.0, 271.0, 131.0, 40.0, 17.0, 1.0, 0.0, 0.0, 1.0], "bins": [-226.2356414794922, -222.1863555908203, -218.13705444335938, -214.0877685546875, -210.03848266601562, -205.98919677734375, -201.9398956298828, -197.89060974121094, -193.84130859375, -189.79202270507812, -185.7427215576172, -181.6934356689453, -177.64414978027344, -173.5948486328125, -169.54556274414062, -165.49627685546875, -161.44699096679688, -157.397705078125, -153.34840393066406, -149.2991180419922, -145.2498321533203, -141.20053100585938, -137.1512451171875, -133.10195922851562, -129.05267333984375, -125.00337982177734, -120.95409393310547, -116.90480041503906, -112.85551452636719, -108.80622100830078, -104.75692749023438, -100.7076416015625, -96.6583480834961, -92.60905456542969, -88.55976867675781, -84.5104751586914, -80.461181640625, -76.41189575195312, -72.36260223388672, -68.31330871582031, -64.26402282714844, -60.2147331237793, -56.165443420410156, -52.11614990234375, -48.06686019897461, -44.01757049560547, -39.96827697753906, -35.91898727416992, -31.86969757080078, -27.82040786743164, -23.771116256713867, -19.721824645996094, -15.672534942626953, -11.623245239257812, -7.573953628540039, -3.5246620178222656, 0.524627685546875, 4.573918342590332, 8.623208999633789, 12.672499656677246, 16.721790313720703, 20.771080017089844, 24.820371627807617, 28.86966323852539, 32.91895294189453]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 10.0, 10.0, 9.0, 14.0, 15.0, 21.0, 17.0, 20.0, 23.0, 40.0, 34.0, 26.0, 44.0, 32.0, 39.0, 41.0, 37.0, 42.0, 43.0, 45.0, 40.0, 41.0, 45.0, 33.0, 29.0, 27.0, 35.0, 20.0, 30.0, 18.0, 23.0, 18.0, 13.0, 10.0, 10.0, 12.0, 6.0, 4.0, 7.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.787132263183594, -30.783100128173828, -29.779069900512695, -28.775039672851562, -27.771007537841797, -26.76697540283203, -25.7629451751709, -24.758914947509766, -23.7548828125, -22.750850677490234, -21.7468204498291, -20.74279022216797, -19.738758087158203, -18.734725952148438, -17.730695724487305, -16.726665496826172, -15.722633361816406, -14.718602180480957, -13.714570999145508, -12.710539817810059, -11.70650863647461, -10.70247745513916, -9.698446273803711, -8.694415092468262, -7.6903839111328125, -6.686352729797363, -5.682321548461914, -4.678290367126465, -3.6742591857910156, -2.6702280044555664, -1.6661968231201172, -0.662165641784668, 0.3418693542480469, 1.345900535583496, 2.3499317169189453, 3.3539628982543945, 4.357994079589844, 5.362025260925293, 6.366056442260742, 7.370087623596191, 8.37411880493164, 9.37814998626709, 10.382181167602539, 11.386212348937988, 12.390243530273438, 13.394274711608887, 14.398305892944336, 15.402337074279785, 16.406368255615234, 17.410400390625, 18.414430618286133, 19.418460845947266, 20.42249298095703, 21.426525115966797, 22.43055534362793, 23.434585571289062, 24.438617706298828, 25.442649841308594, 26.446680068969727, 27.45071029663086, 28.454742431640625, 29.45877456665039, 30.462804794311523, 31.466835021972656, 32.47086715698242]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 8.0, 7.0, 16.0, 13.0, 8.0, 13.0, 33.0, 15.0, 26.0, 31.0, 35.0, 32.0, 41.0, 39.0, 42.0, 37.0, 36.0, 57.0, 37.0, 46.0, 41.0, 44.0, 48.0, 45.0, 27.0, 27.0, 31.0, 31.0, 16.0, 17.0, 15.0, 17.0, 13.0, 12.0, 6.0, 8.0, 6.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.53515625, -6.34893798828125, -6.1627197265625, -5.97650146484375, -5.790283203125, -5.60406494140625, -5.4178466796875, -5.23162841796875, -5.04541015625, -4.85919189453125, -4.6729736328125, -4.48675537109375, -4.300537109375, -4.11431884765625, -3.9281005859375, -3.74188232421875, -3.5556640625, -3.36944580078125, -3.1832275390625, -2.99700927734375, -2.810791015625, -2.62457275390625, -2.4383544921875, -2.25213623046875, -2.06591796875, -1.87969970703125, -1.6934814453125, -1.50726318359375, -1.321044921875, -1.13482666015625, -0.9486083984375, -0.76239013671875, -0.576171875, -0.38995361328125, -0.2037353515625, -0.01751708984375, 0.168701171875, 0.35491943359375, 0.5411376953125, 0.72735595703125, 0.91357421875, 1.09979248046875, 1.2860107421875, 1.47222900390625, 1.658447265625, 1.84466552734375, 2.0308837890625, 2.21710205078125, 2.4033203125, 2.58953857421875, 2.7757568359375, 2.96197509765625, 3.148193359375, 3.33441162109375, 3.5206298828125, 3.70684814453125, 3.89306640625, 4.07928466796875, 4.2655029296875, 4.45172119140625, 4.637939453125, 4.82415771484375, 5.0103759765625, 5.19659423828125, 5.3828125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 10.0, 7.0, 6.0, 18.0, 28.0, 49.0, 88.0, 102.0, 165.0, 246.0, 370.0, 509.0, 741.0, 1133.0, 1684.0, 2589.0, 4089.0, 6371.0, 10143.0, 16447.0, 27098.0, 47168.0, 85006.0, 170141.0, 346329.0, 145570.0, 74894.0, 42064.0, 24778.0, 14834.0, 9240.0, 5802.0, 3755.0, 2376.0, 1572.0, 996.0, 682.0, 485.0, 301.0, 232.0, 151.0, 101.0, 73.0, 32.0, 30.0, 20.0, 10.0, 11.0, 5.0, 5.0, 0.0, 1.0, 2.0, 4.0, 1.0], "bins": [-0.43408203125, -0.4210853576660156, -0.40808868408203125, -0.3950920104980469, -0.3820953369140625, -0.3690986633300781, -0.35610198974609375, -0.3431053161621094, -0.330108642578125, -0.3171119689941406, -0.30411529541015625, -0.2911186218261719, -0.2781219482421875, -0.2651252746582031, -0.25212860107421875, -0.23913192749023438, -0.22613525390625, -0.21313858032226562, -0.20014190673828125, -0.18714523315429688, -0.1741485595703125, -0.16115188598632812, -0.14815521240234375, -0.13515853881835938, -0.122161865234375, -0.10916519165039062, -0.09616851806640625, -0.08317184448242188, -0.0701751708984375, -0.057178497314453125, -0.04418182373046875, -0.031185150146484375, -0.0181884765625, -0.005191802978515625, 0.00780487060546875, 0.020801544189453125, 0.0337982177734375, 0.046794891357421875, 0.05979156494140625, 0.07278823852539062, 0.085784912109375, 0.09878158569335938, 0.11177825927734375, 0.12477493286132812, 0.1377716064453125, 0.15076828002929688, 0.16376495361328125, 0.17676162719726562, 0.18975830078125, 0.20275497436523438, 0.21575164794921875, 0.22874832153320312, 0.2417449951171875, 0.2547416687011719, 0.26773834228515625, 0.2807350158691406, 0.293731689453125, 0.3067283630371094, 0.31972503662109375, 0.3327217102050781, 0.3457183837890625, 0.3587150573730469, 0.37171173095703125, 0.3847084045410156, 0.397705078125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 4.0, 4.0, 8.0, 13.0, 10.0, 10.0, 13.0, 18.0, 20.0, 22.0, 26.0, 26.0, 18.0, 33.0, 32.0, 36.0, 37.0, 39.0, 47.0, 44.0, 1066.0, 49.0, 42.0, 49.0, 44.0, 31.0, 42.0, 32.0, 17.0, 18.0, 21.0, 25.0, 20.0, 19.0, 11.0, 14.0, 17.0, 12.0, 12.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.44140625, -4.311737060546875, -4.18206787109375, -4.052398681640625, -3.9227294921875, -3.793060302734375, -3.66339111328125, -3.533721923828125, -3.404052734375, -3.274383544921875, -3.14471435546875, -3.015045166015625, -2.8853759765625, -2.755706787109375, -2.62603759765625, -2.496368408203125, -2.36669921875, -2.237030029296875, -2.10736083984375, -1.977691650390625, -1.8480224609375, -1.718353271484375, -1.58868408203125, -1.459014892578125, -1.329345703125, -1.199676513671875, -1.07000732421875, -0.940338134765625, -0.8106689453125, -0.680999755859375, -0.55133056640625, -0.421661376953125, -0.2919921875, -0.162322998046875, -0.03265380859375, 0.097015380859375, 0.2266845703125, 0.356353759765625, 0.48602294921875, 0.615692138671875, 0.745361328125, 0.875030517578125, 1.00469970703125, 1.134368896484375, 1.2640380859375, 1.393707275390625, 1.52337646484375, 1.653045654296875, 1.78271484375, 1.912384033203125, 2.04205322265625, 2.171722412109375, 2.3013916015625, 2.431060791015625, 2.56072998046875, 2.690399169921875, 2.820068359375, 2.949737548828125, 3.07940673828125, 3.209075927734375, 3.3387451171875, 3.468414306640625, 3.59808349609375, 3.727752685546875, 3.857421875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 7.0, 5.0, 9.0, 12.0, 13.0, 35.0, 36.0, 59.0, 98.0, 116.0, 171.0, 267.0, 372.0, 598.0, 860.0, 1329.0, 1928.0, 2969.0, 4537.0, 7020.0, 11183.0, 17640.0, 29049.0, 51028.0, 99011.0, 280352.0, 1353576.0, 102221.0, 52454.0, 30187.0, 17950.0, 11199.0, 7156.0, 4573.0, 3012.0, 2038.0, 1305.0, 908.0, 554.0, 409.0, 293.0, 202.0, 121.0, 76.0, 69.0, 41.0, 27.0, 24.0, 10.0, 11.0, 11.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.261474609375, -0.2527656555175781, -0.24405670166015625, -0.23534774780273438, -0.2266387939453125, -0.21792984008789062, -0.20922088623046875, -0.20051193237304688, -0.191802978515625, -0.18309402465820312, -0.17438507080078125, -0.16567611694335938, -0.1569671630859375, -0.14825820922851562, -0.13954925537109375, -0.13084030151367188, -0.12213134765625, -0.11342239379882812, -0.10471343994140625, -0.09600448608398438, -0.0872955322265625, -0.07858657836914062, -0.06987762451171875, -0.061168670654296875, -0.052459716796875, -0.043750762939453125, -0.03504180908203125, -0.026332855224609375, -0.0176239013671875, -0.008914947509765625, -0.00020599365234375, 0.008502960205078125, 0.0172119140625, 0.025920867919921875, 0.03462982177734375, 0.043338775634765625, 0.0520477294921875, 0.060756683349609375, 0.06946563720703125, 0.07817459106445312, 0.086883544921875, 0.09559249877929688, 0.10430145263671875, 0.11301040649414062, 0.1217193603515625, 0.13042831420898438, 0.13913726806640625, 0.14784622192382812, 0.15655517578125, 0.16526412963867188, 0.17397308349609375, 0.18268203735351562, 0.1913909912109375, 0.20009994506835938, 0.20880889892578125, 0.21751785278320312, 0.226226806640625, 0.23493576049804688, 0.24364471435546875, 0.2523536682128906, 0.2610626220703125, 0.2697715759277344, 0.27848052978515625, 0.2871894836425781, 0.2958984375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 1.0, 7.0, 7.0, 6.0, 9.0, 16.0, 14.0, 16.0, 25.0, 38.0, 47.0, 74.0, 110.0, 180.0, 146.0, 87.0, 60.0, 38.0, 20.0, 16.0, 16.0, 18.0, 8.0, 9.0, 5.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3066997528076172e-05, -2.2094696760177612e-05, -2.1122395992279053e-05, -2.0150095224380493e-05, -1.9177794456481934e-05, -1.8205493688583374e-05, -1.7233192920684814e-05, -1.6260892152786255e-05, -1.5288591384887695e-05, -1.4316290616989136e-05, -1.3343989849090576e-05, -1.2371689081192017e-05, -1.1399388313293457e-05, -1.0427087545394897e-05, -9.454786777496338e-06, -8.482486009597778e-06, -7.510185241699219e-06, -6.537884473800659e-06, -5.5655837059021e-06, -4.59328293800354e-06, -3.6209821701049805e-06, -2.648681402206421e-06, -1.6763806343078613e-06, -7.040798664093018e-07, 2.682209014892578e-07, 1.2405216693878174e-06, 2.212822437286377e-06, 3.1851232051849365e-06, 4.157423973083496e-06, 5.129724740982056e-06, 6.102025508880615e-06, 7.074326276779175e-06, 8.046627044677734e-06, 9.018927812576294e-06, 9.991228580474854e-06, 1.0963529348373413e-05, 1.1935830116271973e-05, 1.2908130884170532e-05, 1.3880431652069092e-05, 1.4852732419967651e-05, 1.582503318786621e-05, 1.679733395576477e-05, 1.776963472366333e-05, 1.874193549156189e-05, 1.971423625946045e-05, 2.068653702735901e-05, 2.165883779525757e-05, 2.2631138563156128e-05, 2.3603439331054688e-05, 2.4575740098953247e-05, 2.5548040866851807e-05, 2.6520341634750366e-05, 2.7492642402648926e-05, 2.8464943170547485e-05, 2.9437243938446045e-05, 3.0409544706344604e-05, 3.1381845474243164e-05, 3.2354146242141724e-05, 3.332644701004028e-05, 3.429874777793884e-05, 3.52710485458374e-05, 3.624334931373596e-05, 3.721565008163452e-05, 3.818795084953308e-05, 3.916025161743164e-05]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 3.0, 11.0, 9.0, 5.0, 11.0, 14.0, 18.0, 20.0, 38.0, 60.0, 139.0, 356.0, 7250.0, 1010299.0, 29368.0, 508.0, 184.0, 94.0, 42.0, 25.0, 18.0, 14.0, 18.0, 12.0, 5.0, 10.0, 2.0, 5.0, 4.0, 7.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0008668899536132812, -0.0008450150489807129, -0.0008231401443481445, -0.0008012652397155762, -0.0007793903350830078, -0.0007575154304504395, -0.0007356405258178711, -0.0007137656211853027, -0.0006918907165527344, -0.000670015811920166, -0.0006481409072875977, -0.0006262660026550293, -0.0006043910980224609, -0.0005825161933898926, -0.0005606412887573242, -0.0005387663841247559, -0.0005168914794921875, -0.0004950165748596191, -0.0004731416702270508, -0.0004512667655944824, -0.00042939186096191406, -0.0004075169563293457, -0.00038564205169677734, -0.000363767147064209, -0.0003418922424316406, -0.00032001733779907227, -0.0002981424331665039, -0.00027626752853393555, -0.0002543926239013672, -0.00023251771926879883, -0.00021064281463623047, -0.0001887679100036621, -0.00016689300537109375, -0.0001450181007385254, -0.00012314319610595703, -0.00010126829147338867, -7.939338684082031e-05, -5.751848220825195e-05, -3.5643577575683594e-05, -1.3768672943115234e-05, 8.106231689453125e-06, 2.9981136322021484e-05, 5.1856040954589844e-05, 7.37309455871582e-05, 9.560585021972656e-05, 0.00011748075485229492, 0.00013935565948486328, 0.00016123056411743164, 0.00018310546875, 0.00020498037338256836, 0.00022685527801513672, 0.0002487301826477051, 0.00027060508728027344, 0.0002924799919128418, 0.00031435489654541016, 0.0003362298011779785, 0.0003581047058105469, 0.00037997961044311523, 0.0004018545150756836, 0.00042372941970825195, 0.0004456043243408203, 0.00046747922897338867, 0.000489354133605957, 0.0005112290382385254, 0.0005331039428710938]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 26.0, 138.0, 446.0, 330.0, 62.0, 10.0], "bins": [-0.0001641549461055547, -0.00016145301924552768, -0.0001587511069374159, -0.00015604918007738888, -0.0001533472677692771, -0.00015064534090925008, -0.0001479434286011383, -0.00014524150174111128, -0.0001425395894329995, -0.00013983766257297248, -0.0001371357502648607, -0.00013443382340483367, -0.0001317319110967219, -0.00012902998423669487, -0.00012632807192858309, -0.00012362614506855607, -0.00012092421820852906, -0.00011822229862445965, -0.00011552037904039025, -0.00011281845945632085, -0.00011011653987225145, -0.00010741461301222444, -0.00010471270070411265, -0.00010201077384408563, -9.930886153597385e-05, -9.660694195190445e-05, -9.390502236783504e-05, -9.120310278376564e-05, -8.850118319969624e-05, -8.579925633966923e-05, -8.309734403155744e-05, -8.039541717153043e-05, -7.769349758746102e-05, -7.499157800339162e-05, -7.228965841932222e-05, -6.958773883525282e-05, -6.688581925118342e-05, -6.418389966711402e-05, -6.1481972807087e-05, -5.87800532230176e-05, -5.607813727692701e-05, -5.337621769285761e-05, -5.067429810878821e-05, -4.797237488674e-05, -4.52704553026706e-05, -4.25685357186012e-05, -3.9866616134531796e-05, -3.7164696550462395e-05, -3.446277332841419e-05, -3.1760853744344786e-05, -2.905893234128598e-05, -2.635701275721658e-05, -2.3655091354157776e-05, -2.0953171770088375e-05, -1.8251252186018974e-05, -1.554933078296017e-05, -1.284741210838547e-05, -1.0145491614821367e-05, -7.443571576004615e-06, -4.741651537187863e-06, -2.0397310436237603e-06, 6.621894499403425e-07, 3.3641090340097435e-06, 6.066030437068548e-06, 8.767950021137949e-06]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 5.0, 3.0, 8.0, 15.0, 20.0, 12.0, 10.0, 20.0, 24.0, 17.0, 38.0, 27.0, 36.0, 31.0, 45.0, 50.0, 38.0, 54.0, 38.0, 46.0, 55.0, 45.0, 43.0, 30.0, 38.0, 36.0, 30.0, 27.0, 23.0, 20.0, 33.0, 24.0, 17.0, 7.0, 5.0, 15.0, 8.0, 2.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2218952178955078e-05, -1.1838041245937347e-05, -1.1457130312919617e-05, -1.1076219379901886e-05, -1.0695308446884155e-05, -1.0314397513866425e-05, -9.933486580848694e-06, -9.552575647830963e-06, -9.171664714813232e-06, -8.790753781795502e-06, -8.409842848777771e-06, -8.02893191576004e-06, -7.64802098274231e-06, -7.267110049724579e-06, -6.886199116706848e-06, -6.5052881836891174e-06, -6.124377250671387e-06, -5.743466317653656e-06, -5.362555384635925e-06, -4.981644451618195e-06, -4.600733518600464e-06, -4.219822585582733e-06, -3.8389116525650024e-06, -3.4580007195472717e-06, -3.077089786529541e-06, -2.6961788535118103e-06, -2.3152679204940796e-06, -1.934356987476349e-06, -1.5534460544586182e-06, -1.1725351214408875e-06, -7.916241884231567e-07, -4.10713255405426e-07, -2.9802322387695312e-08, 3.511086106300354e-07, 7.320195436477661e-07, 1.1129304766654968e-06, 1.4938414096832275e-06, 1.8747523427009583e-06, 2.255663275718689e-06, 2.6365742087364197e-06, 3.0174851417541504e-06, 3.398396074771881e-06, 3.779307007789612e-06, 4.1602179408073425e-06, 4.541128873825073e-06, 4.922039806842804e-06, 5.302950739860535e-06, 5.683861672878265e-06, 6.064772605895996e-06, 6.445683538913727e-06, 6.8265944719314575e-06, 7.207505404949188e-06, 7.588416337966919e-06, 7.96932727098465e-06, 8.35023820400238e-06, 8.731149137020111e-06, 9.112060070037842e-06, 9.492971003055573e-06, 9.873881936073303e-06, 1.0254792869091034e-05, 1.0635703802108765e-05, 1.1016614735126495e-05, 1.1397525668144226e-05, 1.1778436601161957e-05, 1.2159347534179688e-05]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 8.0, 7.0, 16.0, 13.0, 8.0, 13.0, 33.0, 15.0, 26.0, 31.0, 35.0, 32.0, 41.0, 39.0, 42.0, 37.0, 36.0, 57.0, 37.0, 46.0, 41.0, 44.0, 48.0, 45.0, 27.0, 27.0, 31.0, 31.0, 16.0, 17.0, 15.0, 17.0, 13.0, 12.0, 6.0, 8.0, 6.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.53515625, -6.34893798828125, -6.1627197265625, -5.97650146484375, -5.790283203125, -5.60406494140625, -5.4178466796875, -5.23162841796875, -5.04541015625, -4.85919189453125, -4.6729736328125, -4.48675537109375, -4.300537109375, -4.11431884765625, -3.9281005859375, -3.74188232421875, -3.5556640625, -3.36944580078125, -3.1832275390625, -2.99700927734375, -2.810791015625, -2.62457275390625, -2.4383544921875, -2.25213623046875, -2.06591796875, -1.87969970703125, -1.6934814453125, -1.50726318359375, -1.321044921875, -1.13482666015625, -0.9486083984375, -0.76239013671875, -0.576171875, -0.38995361328125, -0.2037353515625, -0.01751708984375, 0.168701171875, 0.35491943359375, 0.5411376953125, 0.72735595703125, 0.91357421875, 1.09979248046875, 1.2860107421875, 1.47222900390625, 1.658447265625, 1.84466552734375, 2.0308837890625, 2.21710205078125, 2.4033203125, 2.58953857421875, 2.7757568359375, 2.96197509765625, 3.148193359375, 3.33441162109375, 3.5206298828125, 3.70684814453125, 3.89306640625, 4.07928466796875, 4.2655029296875, 4.45172119140625, 4.637939453125, 4.82415771484375, 5.0103759765625, 5.19659423828125, 5.3828125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 7.0, 11.0, 12.0, 22.0, 37.0, 64.0, 90.0, 131.0, 287.0, 470.0, 853.0, 1457.0, 2685.0, 4512.0, 7648.0, 13222.0, 23016.0, 40763.0, 85709.0, 227021.0, 352282.0, 150825.0, 61365.0, 31905.0, 18570.0, 10784.0, 6318.0, 3658.0, 2074.0, 1145.0, 708.0, 375.0, 211.0, 134.0, 65.0, 47.0, 25.0, 20.0, 18.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.109375, -6.858154296875, -6.60693359375, -6.355712890625, -6.1044921875, -5.853271484375, -5.60205078125, -5.350830078125, -5.099609375, -4.848388671875, -4.59716796875, -4.345947265625, -4.0947265625, -3.843505859375, -3.59228515625, -3.341064453125, -3.08984375, -2.838623046875, -2.58740234375, -2.336181640625, -2.0849609375, -1.833740234375, -1.58251953125, -1.331298828125, -1.080078125, -0.828857421875, -0.57763671875, -0.326416015625, -0.0751953125, 0.176025390625, 0.42724609375, 0.678466796875, 0.9296875, 1.180908203125, 1.43212890625, 1.683349609375, 1.9345703125, 2.185791015625, 2.43701171875, 2.688232421875, 2.939453125, 3.190673828125, 3.44189453125, 3.693115234375, 3.9443359375, 4.195556640625, 4.44677734375, 4.697998046875, 4.94921875, 5.200439453125, 5.45166015625, 5.702880859375, 5.9541015625, 6.205322265625, 6.45654296875, 6.707763671875, 6.958984375, 7.210205078125, 7.46142578125, 7.712646484375, 7.9638671875, 8.215087890625, 8.46630859375, 8.717529296875, 8.96875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 1.0, 4.0, 0.0, 5.0, 3.0, 9.0, 11.0, 9.0, 8.0, 9.0, 9.0, 14.0, 28.0, 22.0, 33.0, 24.0, 34.0, 47.0, 32.0, 53.0, 76.0, 105.0, 159.0, 309.0, 1307.0, 164.0, 93.0, 69.0, 63.0, 45.0, 38.0, 23.0, 24.0, 31.0, 24.0, 24.0, 20.0, 21.0, 12.0, 23.0, 14.0, 1.0, 11.0, 8.0, 4.0, 9.0, 4.0, 4.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0], "bins": [-14.3359375, -13.91455078125, -13.4931640625, -13.07177734375, -12.650390625, -12.22900390625, -11.8076171875, -11.38623046875, -10.96484375, -10.54345703125, -10.1220703125, -9.70068359375, -9.279296875, -8.85791015625, -8.4365234375, -8.01513671875, -7.59375, -7.17236328125, -6.7509765625, -6.32958984375, -5.908203125, -5.48681640625, -5.0654296875, -4.64404296875, -4.22265625, -3.80126953125, -3.3798828125, -2.95849609375, -2.537109375, -2.11572265625, -1.6943359375, -1.27294921875, -0.8515625, -0.43017578125, -0.0087890625, 0.41259765625, 0.833984375, 1.25537109375, 1.6767578125, 2.09814453125, 2.51953125, 2.94091796875, 3.3623046875, 3.78369140625, 4.205078125, 4.62646484375, 5.0478515625, 5.46923828125, 5.890625, 6.31201171875, 6.7333984375, 7.15478515625, 7.576171875, 7.99755859375, 8.4189453125, 8.84033203125, 9.26171875, 9.68310546875, 10.1044921875, 10.52587890625, 10.947265625, 11.36865234375, 11.7900390625, 12.21142578125, 12.6328125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 6.0, 10.0, 15.0, 13.0, 21.0, 35.0, 47.0, 60.0, 114.0, 147.0, 270.0, 653.0, 1924.0, 8011.0, 44759.0, 554271.0, 2410081.0, 104252.0, 15818.0, 3293.0, 981.0, 358.0, 178.0, 111.0, 79.0, 51.0, 44.0, 18.0, 19.0, 10.0, 5.0, 13.0, 7.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.5625, -23.844482421875, -23.12646484375, -22.408447265625, -21.6904296875, -20.972412109375, -20.25439453125, -19.536376953125, -18.818359375, -18.100341796875, -17.38232421875, -16.664306640625, -15.9462890625, -15.228271484375, -14.51025390625, -13.792236328125, -13.07421875, -12.356201171875, -11.63818359375, -10.920166015625, -10.2021484375, -9.484130859375, -8.76611328125, -8.048095703125, -7.330078125, -6.612060546875, -5.89404296875, -5.176025390625, -4.4580078125, -3.739990234375, -3.02197265625, -2.303955078125, -1.5859375, -0.867919921875, -0.14990234375, 0.568115234375, 1.2861328125, 2.004150390625, 2.72216796875, 3.440185546875, 4.158203125, 4.876220703125, 5.59423828125, 6.312255859375, 7.0302734375, 7.748291015625, 8.46630859375, 9.184326171875, 9.90234375, 10.620361328125, 11.33837890625, 12.056396484375, 12.7744140625, 13.492431640625, 14.21044921875, 14.928466796875, 15.646484375, 16.364501953125, 17.08251953125, 17.800537109375, 18.5185546875, 19.236572265625, 19.95458984375, 20.672607421875, 21.390625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 53.0, 243.0, 476.0, 204.0, 24.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.486019134521484, -38.35768127441406, -33.229347229003906, -28.101011276245117, -22.972675323486328, -17.84433937072754, -12.71600341796875, -7.587665557861328, -2.459331512451172, 2.669004440307617, 7.797340393066406, 12.925676345825195, 18.054012298583984, 23.182348251342773, 28.310684204101562, 33.439022064208984, 38.56735610961914, 43.69569396972656, 48.82402801513672, 53.952362060546875, 59.0806999206543, 64.20903778076172, 69.33737182617188, 74.46571350097656, 79.59403991699219, 84.72237396240234, 89.8507080078125, 94.97904968261719, 100.10738372802734, 105.2357177734375, 110.36405944824219, 115.49239349365234, 120.6207275390625, 125.74906158447266, 130.8773956298828, 136.0057373046875, 141.13406372070312, 146.2624053955078, 151.3907470703125, 156.51907348632812, 161.6474151611328, 166.7757568359375, 171.90408325195312, 177.0324249267578, 182.1607666015625, 187.28909301757812, 192.4174346923828, 197.5457763671875, 202.67410278320312, 207.8024444580078, 212.93077087402344, 218.05911254882812, 223.18743896484375, 228.31578063964844, 233.44412231445312, 238.57244873046875, 243.70079040527344, 248.82913208007812, 253.95745849609375, 259.0857849121094, 264.2141418457031, 269.34246826171875, 274.4707946777344, 279.5991516113281, 284.72747802734375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 7.0, 7.0, 9.0, 10.0, 14.0, 15.0, 16.0, 14.0, 11.0, 17.0, 28.0, 30.0, 29.0, 25.0, 40.0, 45.0, 46.0, 35.0, 32.0, 45.0, 46.0, 40.0, 21.0, 39.0, 36.0, 29.0, 27.0, 30.0, 33.0, 28.0, 26.0, 23.0, 27.0, 20.0, 14.0, 15.0, 18.0, 4.0, 12.0, 6.0, 6.0, 8.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.648040771484375, -31.517911911010742, -30.387784957885742, -29.25765609741211, -28.12752914428711, -26.997400283813477, -25.867271423339844, -24.737144470214844, -23.60701560974121, -22.476886749267578, -21.346759796142578, -20.216630935668945, -19.086502075195312, -17.956375122070312, -16.82624626159668, -15.696118354797363, -14.565990447998047, -13.43586254119873, -12.305734634399414, -11.175605773925781, -10.045477867126465, -8.915349960327148, -7.785221576690674, -6.655093193054199, -5.524965286254883, -4.394837379455566, -3.264708995819092, -2.1345808506011963, -1.0044527053833008, 0.12567520141601562, 1.2558035850524902, 2.385931968688965, 3.5160560607910156, 4.646183967590332, 5.776312351226807, 6.906440734863281, 8.036568641662598, 9.166696548461914, 10.296825408935547, 11.426953315734863, 12.55708122253418, 13.687209129333496, 14.817337036132812, 15.947465896606445, 17.077594757080078, 18.207721710205078, 19.33785057067871, 20.467979431152344, 21.598106384277344, 22.728235244750977, 23.858362197875977, 24.98849105834961, 26.11861801147461, 27.248746871948242, 28.378875732421875, 29.509002685546875, 30.639131546020508, 31.76926040649414, 32.89938735961914, 34.02951431274414, 35.159645080566406, 36.289772033691406, 37.419898986816406, 38.55002975463867, 39.68015670776367]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 3.0, 9.0, 5.0, 7.0, 12.0, 17.0, 13.0, 18.0, 17.0, 29.0, 20.0, 18.0, 25.0, 22.0, 42.0, 39.0, 33.0, 34.0, 47.0, 45.0, 38.0, 45.0, 39.0, 36.0, 37.0, 49.0, 40.0, 38.0, 34.0, 28.0, 24.0, 16.0, 23.0, 15.0, 17.0, 12.0, 14.0, 6.0, 13.0, 4.0, 9.0, 2.0, 3.0, 5.0, 1.0, 4.0, 3.0], "bins": [-6.99609375, -6.8118896484375, -6.627685546875, -6.4434814453125, -6.25927734375, -6.0750732421875, -5.890869140625, -5.7066650390625, -5.5224609375, -5.3382568359375, -5.154052734375, -4.9698486328125, -4.78564453125, -4.6014404296875, -4.417236328125, -4.2330322265625, -4.048828125, -3.8646240234375, -3.680419921875, -3.4962158203125, -3.31201171875, -3.1278076171875, -2.943603515625, -2.7593994140625, -2.5751953125, -2.3909912109375, -2.206787109375, -2.0225830078125, -1.83837890625, -1.6541748046875, -1.469970703125, -1.2857666015625, -1.1015625, -0.9173583984375, -0.733154296875, -0.5489501953125, -0.36474609375, -0.1805419921875, 0.003662109375, 0.1878662109375, 0.3720703125, 0.5562744140625, 0.740478515625, 0.9246826171875, 1.10888671875, 1.2930908203125, 1.477294921875, 1.6614990234375, 1.845703125, 2.0299072265625, 2.214111328125, 2.3983154296875, 2.58251953125, 2.7667236328125, 2.950927734375, 3.1351318359375, 3.3193359375, 3.5035400390625, 3.687744140625, 3.8719482421875, 4.05615234375, 4.2403564453125, 4.424560546875, 4.6087646484375, 4.79296875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 10.0, 15.0, 13.0, 11.0, 21.0, 24.0, 38.0, 46.0, 59.0, 59.0, 88.0, 131.0, 189.0, 267.0, 409.0, 1464.0, 201133.0, 3982567.0, 6051.0, 510.0, 338.0, 237.0, 120.0, 110.0, 81.0, 56.0, 36.0, 38.0, 34.0, 23.0, 27.0, 15.0, 13.0, 8.0, 10.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-87.875, -85.3056640625, -82.736328125, -80.1669921875, -77.59765625, -75.0283203125, -72.458984375, -69.8896484375, -67.3203125, -64.7509765625, -62.181640625, -59.6123046875, -57.04296875, -54.4736328125, -51.904296875, -49.3349609375, -46.765625, -44.1962890625, -41.626953125, -39.0576171875, -36.48828125, -33.9189453125, -31.349609375, -28.7802734375, -26.2109375, -23.6416015625, -21.072265625, -18.5029296875, -15.93359375, -13.3642578125, -10.794921875, -8.2255859375, -5.65625, -3.0869140625, -0.517578125, 2.0517578125, 4.62109375, 7.1904296875, 9.759765625, 12.3291015625, 14.8984375, 17.4677734375, 20.037109375, 22.6064453125, 25.17578125, 27.7451171875, 30.314453125, 32.8837890625, 35.453125, 38.0224609375, 40.591796875, 43.1611328125, 45.73046875, 48.2998046875, 50.869140625, 53.4384765625, 56.0078125, 58.5771484375, 61.146484375, 63.7158203125, 66.28515625, 68.8544921875, 71.423828125, 73.9931640625, 76.5625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 0.0, 3.0, 5.0, 6.0, 9.0, 13.0, 9.0, 10.0, 14.0, 28.0, 33.0, 34.0, 51.0, 85.0, 120.0, 166.0, 251.0, 380.0, 599.0, 680.0, 470.0, 305.0, 205.0, 151.0, 113.0, 67.0, 68.0, 35.0, 47.0, 29.0, 18.0, 17.0, 13.0, 9.0, 11.0, 6.0, 2.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8828125, -7.58349609375, -7.2841796875, -6.98486328125, -6.685546875, -6.38623046875, -6.0869140625, -5.78759765625, -5.48828125, -5.18896484375, -4.8896484375, -4.59033203125, -4.291015625, -3.99169921875, -3.6923828125, -3.39306640625, -3.09375, -2.79443359375, -2.4951171875, -2.19580078125, -1.896484375, -1.59716796875, -1.2978515625, -0.99853515625, -0.69921875, -0.39990234375, -0.1005859375, 0.19873046875, 0.498046875, 0.79736328125, 1.0966796875, 1.39599609375, 1.6953125, 1.99462890625, 2.2939453125, 2.59326171875, 2.892578125, 3.19189453125, 3.4912109375, 3.79052734375, 4.08984375, 4.38916015625, 4.6884765625, 4.98779296875, 5.287109375, 5.58642578125, 5.8857421875, 6.18505859375, 6.484375, 6.78369140625, 7.0830078125, 7.38232421875, 7.681640625, 7.98095703125, 8.2802734375, 8.57958984375, 8.87890625, 9.17822265625, 9.4775390625, 9.77685546875, 10.076171875, 10.37548828125, 10.6748046875, 10.97412109375, 11.2734375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 1.0, 5.0, 2.0, 10.0, 5.0, 18.0, 11.0, 25.0, 23.0, 30.0, 39.0, 76.0, 113.0, 325.0, 1458.0, 13244.0, 234852.0, 3741986.0, 188763.0, 11433.0, 1256.0, 290.0, 117.0, 67.0, 37.0, 25.0, 19.0, 10.0, 9.0, 12.0, 4.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.5, -33.2880859375, -32.076171875, -30.8642578125, -29.65234375, -28.4404296875, -27.228515625, -26.0166015625, -24.8046875, -23.5927734375, -22.380859375, -21.1689453125, -19.95703125, -18.7451171875, -17.533203125, -16.3212890625, -15.109375, -13.8974609375, -12.685546875, -11.4736328125, -10.26171875, -9.0498046875, -7.837890625, -6.6259765625, -5.4140625, -4.2021484375, -2.990234375, -1.7783203125, -0.56640625, 0.6455078125, 1.857421875, 3.0693359375, 4.28125, 5.4931640625, 6.705078125, 7.9169921875, 9.12890625, 10.3408203125, 11.552734375, 12.7646484375, 13.9765625, 15.1884765625, 16.400390625, 17.6123046875, 18.82421875, 20.0361328125, 21.248046875, 22.4599609375, 23.671875, 24.8837890625, 26.095703125, 27.3076171875, 28.51953125, 29.7314453125, 30.943359375, 32.1552734375, 33.3671875, 34.5791015625, 35.791015625, 37.0029296875, 38.21484375, 39.4267578125, 40.638671875, 41.8505859375, 43.0625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 10.0, 30.0, 36.0, 86.0, 86.0, 141.0, 179.0, 127.0, 113.0, 66.0, 55.0, 35.0, 16.0, 11.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.683807373046875, -33.77377700805664, -31.86374282836914, -29.953710556030273, -28.043678283691406, -26.133647918701172, -24.223613739013672, -22.313583374023438, -20.403549194335938, -18.49351692199707, -16.583484649658203, -14.673452377319336, -12.763420104980469, -10.853388786315918, -8.94335651397705, -7.033324241638184, -5.123292922973633, -3.2132606506347656, -1.3032286167144775, 0.6068034172058105, 2.5168356895446777, 4.426867485046387, 6.336899757385254, 8.246932029724121, 10.156964302062988, 12.066996574401855, 13.977028846740723, 15.887060165405273, 17.79709243774414, 19.707124710083008, 21.617156982421875, 23.527189254760742, 25.43722152709961, 27.347253799438477, 29.257286071777344, 31.16731834411621, 33.07735061645508, 34.98738098144531, 36.89741516113281, 38.80744552612305, 40.71747970581055, 42.62751007080078, 44.53754425048828, 46.447574615478516, 48.357608795166016, 50.26763916015625, 52.17767333984375, 54.087703704833984, 55.99773406982422, 57.90776443481445, 59.81779861450195, 61.72782897949219, 63.63786315917969, 65.54789733886719, 67.45792388916016, 69.36795806884766, 71.27799224853516, 73.18802642822266, 75.09805297851562, 77.00808715820312, 78.91812133789062, 80.82815551757812, 82.7381820678711, 84.6482162475586, 86.5582504272461]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 10.0, 12.0, 14.0, 14.0, 15.0, 19.0, 13.0, 23.0, 23.0, 18.0, 27.0, 31.0, 43.0, 30.0, 38.0, 37.0, 31.0, 42.0, 40.0, 41.0, 47.0, 41.0, 43.0, 33.0, 37.0, 32.0, 28.0, 34.0, 28.0, 26.0, 22.0, 18.0, 20.0, 13.0, 10.0, 12.0, 8.0, 9.0, 3.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-31.921844482421875, -30.95384407043457, -29.9858455657959, -29.017845153808594, -28.049846649169922, -27.081846237182617, -26.113845825195312, -25.14584732055664, -24.177846908569336, -23.20984649658203, -22.24184799194336, -21.273847579956055, -20.30584716796875, -19.337848663330078, -18.369848251342773, -17.40184783935547, -16.433849334716797, -15.465849876403809, -14.49785041809082, -13.529850006103516, -12.561850547790527, -11.593851089477539, -10.625850677490234, -9.657851219177246, -8.689851760864258, -7.7218523025512695, -6.753852367401123, -5.785852432250977, -4.817852973937988, -3.849853515625, -2.8818535804748535, -1.913853645324707, -0.9458541870117188, 0.022145509719848633, 0.990145206451416, 1.9581449031829834, 2.926144599914551, 3.894144058227539, 4.8621439933776855, 5.830143928527832, 6.79814338684082, 7.766142845153809, 8.734142303466797, 9.702142715454102, 10.67014217376709, 11.638141632080078, 12.606142044067383, 13.574141502380371, 14.54214096069336, 15.510140419006348, 16.478139877319336, 17.44614028930664, 18.414138793945312, 19.382139205932617, 20.350139617919922, 21.318138122558594, 22.2861385345459, 23.254138946533203, 24.222137451171875, 25.19013786315918, 26.158138275146484, 27.126136779785156, 28.09413719177246, 29.062137603759766, 30.030136108398438]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 7.0, 2.0, 1.0, 4.0, 8.0, 8.0, 8.0, 12.0, 10.0, 15.0, 14.0, 23.0, 22.0, 34.0, 38.0, 35.0, 31.0, 33.0, 29.0, 49.0, 43.0, 45.0, 37.0, 50.0, 40.0, 37.0, 34.0, 42.0, 35.0, 44.0, 28.0, 25.0, 25.0, 19.0, 19.0, 14.0, 18.0, 12.0, 12.0, 13.0, 4.0, 8.0, 8.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.671875, -6.476318359375, -6.28076171875, -6.085205078125, -5.8896484375, -5.694091796875, -5.49853515625, -5.302978515625, -5.107421875, -4.911865234375, -4.71630859375, -4.520751953125, -4.3251953125, -4.129638671875, -3.93408203125, -3.738525390625, -3.54296875, -3.347412109375, -3.15185546875, -2.956298828125, -2.7607421875, -2.565185546875, -2.36962890625, -2.174072265625, -1.978515625, -1.782958984375, -1.58740234375, -1.391845703125, -1.1962890625, -1.000732421875, -0.80517578125, -0.609619140625, -0.4140625, -0.218505859375, -0.02294921875, 0.172607421875, 0.3681640625, 0.563720703125, 0.75927734375, 0.954833984375, 1.150390625, 1.345947265625, 1.54150390625, 1.737060546875, 1.9326171875, 2.128173828125, 2.32373046875, 2.519287109375, 2.71484375, 2.910400390625, 3.10595703125, 3.301513671875, 3.4970703125, 3.692626953125, 3.88818359375, 4.083740234375, 4.279296875, 4.474853515625, 4.67041015625, 4.865966796875, 5.0615234375, 5.257080078125, 5.45263671875, 5.648193359375, 5.84375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 6.0, 10.0, 16.0, 27.0, 28.0, 53.0, 64.0, 111.0, 140.0, 231.0, 338.0, 469.0, 725.0, 1069.0, 1555.0, 2322.0, 3518.0, 5220.0, 7994.0, 12243.0, 19130.0, 30769.0, 50513.0, 85257.0, 164507.0, 332812.0, 134878.0, 73796.0, 43841.0, 27232.0, 17075.0, 11039.0, 7129.0, 4771.0, 3213.0, 2088.0, 1373.0, 958.0, 645.0, 450.0, 286.0, 205.0, 158.0, 101.0, 63.0, 40.0, 40.0, 18.0, 11.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.459228515625, -0.4450416564941406, -0.43085479736328125, -0.4166679382324219, -0.4024810791015625, -0.3882942199707031, -0.37410736083984375, -0.3599205017089844, -0.345733642578125, -0.3315467834472656, -0.31735992431640625, -0.3031730651855469, -0.2889862060546875, -0.2747993469238281, -0.26061248779296875, -0.24642562866210938, -0.23223876953125, -0.21805191040039062, -0.20386505126953125, -0.18967819213867188, -0.1754913330078125, -0.16130447387695312, -0.14711761474609375, -0.13293075561523438, -0.118743896484375, -0.10455703735351562, -0.09037017822265625, -0.07618331909179688, -0.0619964599609375, -0.047809600830078125, -0.03362274169921875, -0.019435882568359375, -0.0052490234375, 0.008937835693359375, 0.02312469482421875, 0.037311553955078125, 0.0514984130859375, 0.06568527221679688, 0.07987213134765625, 0.09405899047851562, 0.108245849609375, 0.12243270874023438, 0.13661956787109375, 0.15080642700195312, 0.1649932861328125, 0.17918014526367188, 0.19336700439453125, 0.20755386352539062, 0.22174072265625, 0.23592758178710938, 0.25011444091796875, 0.2643013000488281, 0.2784881591796875, 0.2926750183105469, 0.30686187744140625, 0.3210487365722656, 0.335235595703125, 0.3494224548339844, 0.36360931396484375, 0.3777961730957031, 0.3919830322265625, 0.4061698913574219, 0.42035675048828125, 0.4345436096191406, 0.44873046875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 4.0, 6.0, 10.0, 3.0, 10.0, 6.0, 17.0, 14.0, 14.0, 16.0, 21.0, 31.0, 23.0, 24.0, 32.0, 24.0, 37.0, 20.0, 45.0, 41.0, 25.0, 44.0, 1068.0, 38.0, 34.0, 40.0, 35.0, 39.0, 30.0, 30.0, 25.0, 28.0, 26.0, 19.0, 18.0, 22.0, 16.0, 15.0, 10.0, 10.0, 6.0, 13.0, 12.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.37109375, -4.237060546875, -4.10302734375, -3.968994140625, -3.8349609375, -3.700927734375, -3.56689453125, -3.432861328125, -3.298828125, -3.164794921875, -3.03076171875, -2.896728515625, -2.7626953125, -2.628662109375, -2.49462890625, -2.360595703125, -2.2265625, -2.092529296875, -1.95849609375, -1.824462890625, -1.6904296875, -1.556396484375, -1.42236328125, -1.288330078125, -1.154296875, -1.020263671875, -0.88623046875, -0.752197265625, -0.6181640625, -0.484130859375, -0.35009765625, -0.216064453125, -0.08203125, 0.052001953125, 0.18603515625, 0.320068359375, 0.4541015625, 0.588134765625, 0.72216796875, 0.856201171875, 0.990234375, 1.124267578125, 1.25830078125, 1.392333984375, 1.5263671875, 1.660400390625, 1.79443359375, 1.928466796875, 2.0625, 2.196533203125, 2.33056640625, 2.464599609375, 2.5986328125, 2.732666015625, 2.86669921875, 3.000732421875, 3.134765625, 3.268798828125, 3.40283203125, 3.536865234375, 3.6708984375, 3.804931640625, 3.93896484375, 4.072998046875, 4.20703125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 8.0, 11.0, 14.0, 28.0, 50.0, 65.0, 81.0, 109.0, 176.0, 251.0, 323.0, 522.0, 756.0, 1033.0, 1460.0, 2251.0, 3337.0, 4721.0, 7346.0, 11172.0, 17148.0, 27618.0, 45887.0, 81114.0, 169098.0, 1406324.0, 136085.0, 69546.0, 40226.0, 24525.0, 15441.0, 9894.0, 6528.0, 4471.0, 2879.0, 2092.0, 1375.0, 960.0, 647.0, 465.0, 330.0, 230.0, 179.0, 111.0, 60.0, 53.0, 42.0, 26.0, 15.0, 19.0, 9.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.281005859375, -0.2720489501953125, -0.263092041015625, -0.2541351318359375, -0.24517822265625, -0.2362213134765625, -0.227264404296875, -0.2183074951171875, -0.2093505859375, -0.2003936767578125, -0.191436767578125, -0.1824798583984375, -0.17352294921875, -0.1645660400390625, -0.155609130859375, -0.1466522216796875, -0.1376953125, -0.1287384033203125, -0.119781494140625, -0.1108245849609375, -0.10186767578125, -0.0929107666015625, -0.083953857421875, -0.0749969482421875, -0.0660400390625, -0.0570831298828125, -0.048126220703125, -0.0391693115234375, -0.03021240234375, -0.0212554931640625, -0.012298583984375, -0.0033416748046875, 0.005615234375, 0.0145721435546875, 0.023529052734375, 0.0324859619140625, 0.04144287109375, 0.0503997802734375, 0.059356689453125, 0.0683135986328125, 0.0772705078125, 0.0862274169921875, 0.095184326171875, 0.1041412353515625, 0.11309814453125, 0.1220550537109375, 0.131011962890625, 0.1399688720703125, 0.14892578125, 0.1578826904296875, 0.166839599609375, 0.1757965087890625, 0.18475341796875, 0.1937103271484375, 0.202667236328125, 0.2116241455078125, 0.2205810546875, 0.2295379638671875, 0.238494873046875, 0.2474517822265625, 0.25640869140625, 0.2653656005859375, 0.274322509765625, 0.2832794189453125, 0.292236328125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 7.0, 1.0, 6.0, 2.0, 9.0, 8.0, 10.0, 20.0, 10.0, 17.0, 25.0, 39.0, 43.0, 51.0, 79.0, 142.0, 122.0, 102.0, 72.0, 48.0, 43.0, 23.0, 29.0, 23.0, 18.0, 8.0, 10.0, 10.0, 3.0, 5.0, 5.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0325183868408203e-05, -1.9606202840805054e-05, -1.8887221813201904e-05, -1.8168240785598755e-05, -1.7449259757995605e-05, -1.6730278730392456e-05, -1.6011297702789307e-05, -1.5292316675186157e-05, -1.4573335647583008e-05, -1.3854354619979858e-05, -1.3135373592376709e-05, -1.241639256477356e-05, -1.169741153717041e-05, -1.097843050956726e-05, -1.0259449481964111e-05, -9.540468454360962e-06, -8.821487426757812e-06, -8.102506399154663e-06, -7.383525371551514e-06, -6.664544343948364e-06, -5.945563316345215e-06, -5.2265822887420654e-06, -4.507601261138916e-06, -3.7886202335357666e-06, -3.069639205932617e-06, -2.3506581783294678e-06, -1.6316771507263184e-06, -9.126961231231689e-07, -1.9371509552001953e-07, 5.252659320831299e-07, 1.2442469596862793e-06, 1.9632279872894287e-06, 2.682209014892578e-06, 3.4011900424957275e-06, 4.120171070098877e-06, 4.839152097702026e-06, 5.558133125305176e-06, 6.277114152908325e-06, 6.996095180511475e-06, 7.715076208114624e-06, 8.434057235717773e-06, 9.153038263320923e-06, 9.872019290924072e-06, 1.0591000318527222e-05, 1.1309981346130371e-05, 1.202896237373352e-05, 1.274794340133667e-05, 1.346692442893982e-05, 1.4185905456542969e-05, 1.4904886484146118e-05, 1.5623867511749268e-05, 1.6342848539352417e-05, 1.7061829566955566e-05, 1.7780810594558716e-05, 1.8499791622161865e-05, 1.9218772649765015e-05, 1.9937753677368164e-05, 2.0656734704971313e-05, 2.1375715732574463e-05, 2.2094696760177612e-05, 2.2813677787780762e-05, 2.353265881538391e-05, 2.425163984298706e-05, 2.497062087059021e-05, 2.568960189819336e-05]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 5.0, 5.0, 4.0, 16.0, 9.0, 16.0, 15.0, 29.0, 41.0, 72.0, 83.0, 143.0, 233.0, 588.0, 5267.0, 188766.0, 834358.0, 17029.0, 1063.0, 322.0, 168.0, 85.0, 60.0, 45.0, 37.0, 20.0, 21.0, 13.0, 10.0, 4.0, 8.0, 2.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004494190216064453, -0.0004362724721431732, -0.0004231259226799011, -0.00040997937321662903, -0.00039683282375335693, -0.00038368627429008484, -0.00037053972482681274, -0.00035739317536354065, -0.00034424662590026855, -0.00033110007643699646, -0.00031795352697372437, -0.00030480697751045227, -0.0002916604280471802, -0.0002785138785839081, -0.000265367329120636, -0.0002522207796573639, -0.0002390742301940918, -0.0002259276807308197, -0.0002127811312675476, -0.0001996345818042755, -0.00018648803234100342, -0.00017334148287773132, -0.00016019493341445923, -0.00014704838395118713, -0.00013390183448791504, -0.00012075528502464294, -0.00010760873556137085, -9.446218609809875e-05, -8.131563663482666e-05, -6.816908717155457e-05, -5.502253770828247e-05, -4.1875988245010376e-05, -2.872943878173828e-05, -1.5582889318466187e-05, -2.436339855194092e-06, 1.0710209608078003e-05, 2.3856759071350098e-05, 3.700330853462219e-05, 5.014985799789429e-05, 6.329640746116638e-05, 7.644295692443848e-05, 8.958950638771057e-05, 0.00010273605585098267, 0.00011588260531425476, 0.00012902915477752686, 0.00014217570424079895, 0.00015532225370407104, 0.00016846880316734314, 0.00018161535263061523, 0.00019476190209388733, 0.00020790845155715942, 0.00022105500102043152, 0.0002342015504837036, 0.0002473480999469757, 0.0002604946494102478, 0.0002736411988735199, 0.000286787748336792, 0.0002999342978000641, 0.0003130808472633362, 0.0003262273967266083, 0.00033937394618988037, 0.00035252049565315247, 0.00036566704511642456, 0.00037881359457969666, 0.00039196014404296875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 9.0, 15.0, 19.0, 40.0, 43.0, 80.0, 124.0, 128.0, 134.0, 126.0, 101.0, 64.0, 47.0, 25.0, 13.0, 15.0, 11.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4460195416177157e-05, -1.3707663129025605e-05, -1.2955130841874052e-05, -1.2202599464217201e-05, -1.1450067177065648e-05, -1.0697534889914095e-05, -9.945002602762543e-06, -9.19247031561099e-06, -8.439938028459437e-06, -7.687405741307884e-06, -6.934873454156332e-06, -6.18234162175213e-06, -5.429809334600577e-06, -4.677277047449024e-06, -3.9247452150448225e-06, -3.17221292789327e-06, -2.419680640741717e-06, -1.667148467277002e-06, -9.14616293812287e-07, -1.6208423403440975e-07, 5.90448053117143e-07, 1.3429803402686957e-06, 2.0955121726728976e-06, 2.8480444598244503e-06, 3.600576746976003e-06, 4.353109034127556e-06, 5.1056413212791085e-06, 5.85817315368331e-06, 6.610705440834863e-06, 7.363237727986416e-06, 8.115769560390618e-06, 8.86830184754217e-06, 9.620835044188425e-06, 1.0373367331339978e-05, 1.112589961849153e-05, 1.1878431905643083e-05, 1.2630964192794636e-05, 1.3383496479946189e-05, 1.413602785760304e-05, 1.4888560144754592e-05, 1.5641093341400847e-05, 1.63936256285524e-05, 1.7146157915703952e-05, 1.7898690202855505e-05, 1.8651222490007058e-05, 1.940375477715861e-05, 2.0156287064310163e-05, 2.0908817532472312e-05, 2.1661349819623865e-05, 2.2413882106775418e-05, 2.316641439392697e-05, 2.3918946681078523e-05, 2.4671478968230076e-05, 2.542401125538163e-05, 2.6176541723543778e-05, 2.6929075829684734e-05, 2.7681606297846884e-05, 2.8434138584998436e-05, 2.918667087214999e-05, 2.9939203159301542e-05, 3.0691735446453094e-05, 3.1444265914615244e-05, 3.21968000207562e-05, 3.294933048891835e-05, 3.3701864595059305e-05]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 7.0, 5.0, 4.0, 13.0, 10.0, 12.0, 23.0, 18.0, 23.0, 20.0, 26.0, 38.0, 37.0, 35.0, 49.0, 40.0, 38.0, 42.0, 49.0, 30.0, 45.0, 41.0, 45.0, 36.0, 44.0, 36.0, 21.0, 23.0, 29.0, 31.0, 22.0, 16.0, 19.0, 9.0, 8.0, 14.0, 5.0, 13.0, 1.0, 6.0, 4.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.119510650634766e-06, -8.827075362205505e-06, -8.534640073776245e-06, -8.242204785346985e-06, -7.949769496917725e-06, -7.657334208488464e-06, -7.364898920059204e-06, -7.072463631629944e-06, -6.780028343200684e-06, -6.487593054771423e-06, -6.195157766342163e-06, -5.902722477912903e-06, -5.610287189483643e-06, -5.317851901054382e-06, -5.025416612625122e-06, -4.732981324195862e-06, -4.4405460357666016e-06, -4.148110747337341e-06, -3.855675458908081e-06, -3.563240170478821e-06, -3.2708048820495605e-06, -2.9783695936203003e-06, -2.68593430519104e-06, -2.3934990167617798e-06, -2.1010637283325195e-06, -1.8086284399032593e-06, -1.516193151473999e-06, -1.2237578630447388e-06, -9.313225746154785e-07, -6.388872861862183e-07, -3.46451997756958e-07, -5.4016709327697754e-08, 2.384185791015625e-07, 5.308538675308228e-07, 8.23289155960083e-07, 1.1157244443893433e-06, 1.4081597328186035e-06, 1.7005950212478638e-06, 1.993030309677124e-06, 2.2854655981063843e-06, 2.5779008865356445e-06, 2.8703361749649048e-06, 3.162771463394165e-06, 3.4552067518234253e-06, 3.7476420402526855e-06, 4.040077328681946e-06, 4.332512617111206e-06, 4.624947905540466e-06, 4.9173831939697266e-06, 5.209818482398987e-06, 5.502253770828247e-06, 5.794689059257507e-06, 6.087124347686768e-06, 6.379559636116028e-06, 6.671994924545288e-06, 6.964430212974548e-06, 7.256865501403809e-06, 7.549300789833069e-06, 7.841736078262329e-06, 8.13417136669159e-06, 8.42660665512085e-06, 8.71904194355011e-06, 9.01147723197937e-06, 9.30391252040863e-06, 9.59634780883789e-06]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 7.0, 2.0, 1.0, 4.0, 8.0, 8.0, 8.0, 12.0, 10.0, 15.0, 14.0, 23.0, 22.0, 34.0, 38.0, 35.0, 31.0, 33.0, 29.0, 49.0, 43.0, 45.0, 37.0, 50.0, 40.0, 37.0, 34.0, 42.0, 35.0, 44.0, 28.0, 25.0, 25.0, 19.0, 19.0, 14.0, 18.0, 12.0, 12.0, 13.0, 4.0, 8.0, 8.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.671875, -6.476318359375, -6.28076171875, -6.085205078125, -5.8896484375, -5.694091796875, -5.49853515625, -5.302978515625, -5.107421875, -4.911865234375, -4.71630859375, -4.520751953125, -4.3251953125, -4.129638671875, -3.93408203125, -3.738525390625, -3.54296875, -3.347412109375, -3.15185546875, -2.956298828125, -2.7607421875, -2.565185546875, -2.36962890625, -2.174072265625, -1.978515625, -1.782958984375, -1.58740234375, -1.391845703125, -1.1962890625, -1.000732421875, -0.80517578125, -0.609619140625, -0.4140625, -0.218505859375, -0.02294921875, 0.172607421875, 0.3681640625, 0.563720703125, 0.75927734375, 0.954833984375, 1.150390625, 1.345947265625, 1.54150390625, 1.737060546875, 1.9326171875, 2.128173828125, 2.32373046875, 2.519287109375, 2.71484375, 2.910400390625, 3.10595703125, 3.301513671875, 3.4970703125, 3.692626953125, 3.88818359375, 4.083740234375, 4.279296875, 4.474853515625, 4.67041015625, 4.865966796875, 5.0615234375, 5.257080078125, 5.45263671875, 5.648193359375, 5.84375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 14.0, 17.0, 28.0, 33.0, 42.0, 59.0, 94.0, 136.0, 191.0, 257.0, 350.0, 539.0, 771.0, 1256.0, 1863.0, 3194.0, 5293.0, 9738.0, 17715.0, 33919.0, 65580.0, 125567.0, 214829.0, 237360.0, 154323.0, 82559.0, 42186.0, 22279.0, 11722.0, 6434.0, 3671.0, 2262.0, 1362.0, 908.0, 609.0, 417.0, 308.0, 201.0, 140.0, 107.0, 70.0, 56.0, 38.0, 18.0, 13.0, 10.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.88861083984375, -5.6795654296875, -5.47052001953125, -5.261474609375, -5.05242919921875, -4.8433837890625, -4.63433837890625, -4.42529296875, -4.21624755859375, -4.0072021484375, -3.79815673828125, -3.589111328125, -3.38006591796875, -3.1710205078125, -2.96197509765625, -2.7529296875, -2.54388427734375, -2.3348388671875, -2.12579345703125, -1.916748046875, -1.70770263671875, -1.4986572265625, -1.28961181640625, -1.08056640625, -0.87152099609375, -0.6624755859375, -0.45343017578125, -0.244384765625, -0.03533935546875, 0.1737060546875, 0.38275146484375, 0.591796875, 0.80084228515625, 1.0098876953125, 1.21893310546875, 1.427978515625, 1.63702392578125, 1.8460693359375, 2.05511474609375, 2.26416015625, 2.47320556640625, 2.6822509765625, 2.89129638671875, 3.100341796875, 3.30938720703125, 3.5184326171875, 3.72747802734375, 3.9365234375, 4.14556884765625, 4.3546142578125, 4.56365966796875, 4.772705078125, 4.98175048828125, 5.1907958984375, 5.39984130859375, 5.60888671875, 5.81793212890625, 6.0269775390625, 6.23602294921875, 6.445068359375, 6.65411376953125, 6.8631591796875, 7.07220458984375, 7.28125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 9.0, 2.0, 3.0, 7.0, 6.0, 9.0, 10.0, 15.0, 16.0, 17.0, 18.0, 18.0, 35.0, 35.0, 27.0, 48.0, 55.0, 88.0, 119.0, 190.0, 1344.0, 284.0, 183.0, 102.0, 65.0, 44.0, 42.0, 48.0, 39.0, 27.0, 23.0, 21.0, 18.0, 17.0, 14.0, 16.0, 12.0, 8.0, 6.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7578125, -14.2476806640625, -13.737548828125, -13.2274169921875, -12.71728515625, -12.2071533203125, -11.697021484375, -11.1868896484375, -10.6767578125, -10.1666259765625, -9.656494140625, -9.1463623046875, -8.63623046875, -8.1260986328125, -7.615966796875, -7.1058349609375, -6.595703125, -6.0855712890625, -5.575439453125, -5.0653076171875, -4.55517578125, -4.0450439453125, -3.534912109375, -3.0247802734375, -2.5146484375, -2.0045166015625, -1.494384765625, -0.9842529296875, -0.47412109375, 0.0360107421875, 0.546142578125, 1.0562744140625, 1.56640625, 2.0765380859375, 2.586669921875, 3.0968017578125, 3.60693359375, 4.1170654296875, 4.627197265625, 5.1373291015625, 5.6474609375, 6.1575927734375, 6.667724609375, 7.1778564453125, 7.68798828125, 8.1981201171875, 8.708251953125, 9.2183837890625, 9.728515625, 10.2386474609375, 10.748779296875, 11.2589111328125, 11.76904296875, 12.2791748046875, 12.789306640625, 13.2994384765625, 13.8095703125, 14.3197021484375, 14.829833984375, 15.3399658203125, 15.85009765625, 16.3602294921875, 16.870361328125, 17.3804931640625, 17.890625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 4.0, 8.0, 10.0, 20.0, 22.0, 26.0, 47.0, 66.0, 101.0, 120.0, 218.0, 406.0, 802.0, 2304.0, 51903.0, 3017078.0, 68170.0, 2546.0, 772.0, 405.0, 238.0, 141.0, 83.0, 50.0, 42.0, 26.0, 20.0, 21.0, 14.0, 16.0, 4.0, 6.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.4375, -35.11376953125, -33.7900390625, -32.46630859375, -31.142578125, -29.81884765625, -28.4951171875, -27.17138671875, -25.84765625, -24.52392578125, -23.2001953125, -21.87646484375, -20.552734375, -19.22900390625, -17.9052734375, -16.58154296875, -15.2578125, -13.93408203125, -12.6103515625, -11.28662109375, -9.962890625, -8.63916015625, -7.3154296875, -5.99169921875, -4.66796875, -3.34423828125, -2.0205078125, -0.69677734375, 0.626953125, 1.95068359375, 3.2744140625, 4.59814453125, 5.921875, 7.24560546875, 8.5693359375, 9.89306640625, 11.216796875, 12.54052734375, 13.8642578125, 15.18798828125, 16.51171875, 17.83544921875, 19.1591796875, 20.48291015625, 21.806640625, 23.13037109375, 24.4541015625, 25.77783203125, 27.1015625, 28.42529296875, 29.7490234375, 31.07275390625, 32.396484375, 33.72021484375, 35.0439453125, 36.36767578125, 37.69140625, 39.01513671875, 40.3388671875, 41.66259765625, 42.986328125, 44.31005859375, 45.6337890625, 46.95751953125, 48.28125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 124.0, 444.0, 350.0, 73.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-354.2718811035156, -347.1657409667969, -340.05963134765625, -332.9534912109375, -325.84735107421875, -318.7412414550781, -311.6351013183594, -304.52899169921875, -297.4228515625, -290.31671142578125, -283.2106018066406, -276.1044616699219, -268.9983215332031, -261.8922119140625, -254.78607177734375, -247.67994689941406, -240.57382202148438, -233.4676971435547, -226.36155700683594, -219.25543212890625, -212.14930725097656, -205.04318237304688, -197.93704223632812, -190.83091735839844, -183.7247772216797, -176.61865234375, -169.51251220703125, -162.40638732910156, -155.30026245117188, -148.19412231445312, -141.08799743652344, -133.98187255859375, -126.87574005126953, -119.76960754394531, -112.66348266601562, -105.5573501586914, -98.45122528076172, -91.3450927734375, -84.23896789550781, -77.1328353881836, -70.02670288085938, -62.92057418823242, -55.81444549560547, -48.70831298828125, -41.60218811035156, -34.496055603027344, -27.38992691040039, -20.283798217773438, -13.17767333984375, -6.071544170379639, 1.0345849990844727, 8.140714645385742, 15.246843338012695, 22.35297393798828, 29.459102630615234, 36.56523132324219, 43.67136001586914, 50.777488708496094, 57.88361740112305, 64.98974609375, 72.09587860107422, 79.20201110839844, 86.30813598632812, 93.41426086425781, 100.52039337158203]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 8.0, 12.0, 12.0, 13.0, 10.0, 13.0, 26.0, 25.0, 36.0, 27.0, 32.0, 34.0, 44.0, 51.0, 48.0, 45.0, 40.0, 57.0, 48.0, 34.0, 55.0, 46.0, 34.0, 25.0, 29.0, 30.0, 31.0, 23.0, 20.0, 23.0, 10.0, 18.0, 10.0, 6.0, 7.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.68825912475586, -49.927608489990234, -48.166961669921875, -46.40631103515625, -44.645660400390625, -42.885013580322266, -41.12436294555664, -39.36371612548828, -37.603065490722656, -35.84241485595703, -34.08176803588867, -32.32111740112305, -30.560468673706055, -28.799819946289062, -27.039169311523438, -25.278520584106445, -23.517871856689453, -21.75722312927246, -19.99657440185547, -18.235923767089844, -16.47527503967285, -14.71462631225586, -12.95397663116455, -11.193326950073242, -9.43267822265625, -7.6720290184021, -5.911379814147949, -4.150730609893799, -2.3900814056396484, -0.6294326782226562, 1.1312170028686523, 2.891866683959961, 4.652519226074219, 6.413168430328369, 8.17381763458252, 9.934467315673828, 11.69511604309082, 13.455764770507812, 15.216414451599121, 16.97706413269043, 18.737712860107422, 20.498361587524414, 22.259010314941406, 24.01966094970703, 25.780309677124023, 27.540958404541016, 29.30160903930664, 31.062257766723633, 32.822906494140625, 34.58355712890625, 36.34420394897461, 38.104854583740234, 39.865501403808594, 41.62615203857422, 43.386802673339844, 45.14745330810547, 46.90810012817383, 48.66875076293945, 50.42939758300781, 52.19004821777344, 53.95069885253906, 55.71134567260742, 57.47199630737305, 59.232643127441406, 60.99329376220703]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 11.0, 4.0, 7.0, 14.0, 15.0, 11.0, 24.0, 30.0, 28.0, 26.0, 33.0, 46.0, 38.0, 32.0, 42.0, 39.0, 40.0, 53.0, 40.0, 33.0, 33.0, 51.0, 41.0, 35.0, 38.0, 24.0, 27.0, 26.0, 20.0, 23.0, 17.0, 14.0, 15.0, 22.0, 6.0, 9.0, 9.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.76171875, -6.5579833984375, -6.354248046875, -6.1505126953125, -5.94677734375, -5.7430419921875, -5.539306640625, -5.3355712890625, -5.1318359375, -4.9281005859375, -4.724365234375, -4.5206298828125, -4.31689453125, -4.1131591796875, -3.909423828125, -3.7056884765625, -3.501953125, -3.2982177734375, -3.094482421875, -2.8907470703125, -2.68701171875, -2.4832763671875, -2.279541015625, -2.0758056640625, -1.8720703125, -1.6683349609375, -1.464599609375, -1.2608642578125, -1.05712890625, -0.8533935546875, -0.649658203125, -0.4459228515625, -0.2421875, -0.0384521484375, 0.165283203125, 0.3690185546875, 0.57275390625, 0.7764892578125, 0.980224609375, 1.1839599609375, 1.3876953125, 1.5914306640625, 1.795166015625, 1.9989013671875, 2.20263671875, 2.4063720703125, 2.610107421875, 2.8138427734375, 3.017578125, 3.2213134765625, 3.425048828125, 3.6287841796875, 3.83251953125, 4.0362548828125, 4.239990234375, 4.4437255859375, 4.6474609375, 4.8511962890625, 5.054931640625, 5.2586669921875, 5.46240234375, 5.6661376953125, 5.869873046875, 6.0736083984375, 6.27734375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 7.0, 9.0, 10.0, 11.0, 12.0, 27.0, 62.0, 63.0, 85.0, 123.0, 205.0, 298.0, 484.0, 657.0, 1099.0, 1671.0, 2729.0, 4552.0, 7986.0, 15229.0, 31978.0, 84293.0, 342342.0, 1622973.0, 1598144.0, 330169.0, 82014.0, 32018.0, 15271.0, 7942.0, 4387.0, 2646.0, 1673.0, 1025.0, 674.0, 446.0, 321.0, 233.0, 120.0, 91.0, 75.0, 47.0, 24.0, 22.0, 11.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-12.3359375, -11.9833984375, -11.630859375, -11.2783203125, -10.92578125, -10.5732421875, -10.220703125, -9.8681640625, -9.515625, -9.1630859375, -8.810546875, -8.4580078125, -8.10546875, -7.7529296875, -7.400390625, -7.0478515625, -6.6953125, -6.3427734375, -5.990234375, -5.6376953125, -5.28515625, -4.9326171875, -4.580078125, -4.2275390625, -3.875, -3.5224609375, -3.169921875, -2.8173828125, -2.46484375, -2.1123046875, -1.759765625, -1.4072265625, -1.0546875, -0.7021484375, -0.349609375, 0.0029296875, 0.35546875, 0.7080078125, 1.060546875, 1.4130859375, 1.765625, 2.1181640625, 2.470703125, 2.8232421875, 3.17578125, 3.5283203125, 3.880859375, 4.2333984375, 4.5859375, 4.9384765625, 5.291015625, 5.6435546875, 5.99609375, 6.3486328125, 6.701171875, 7.0537109375, 7.40625, 7.7587890625, 8.111328125, 8.4638671875, 8.81640625, 9.1689453125, 9.521484375, 9.8740234375, 10.2265625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 13.0, 18.0, 23.0, 28.0, 52.0, 68.0, 120.0, 222.0, 354.0, 600.0, 859.0, 659.0, 396.0, 283.0, 119.0, 92.0, 60.0, 29.0, 20.0, 10.0, 11.0, 7.0, 7.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.390625, -14.88720703125, -14.3837890625, -13.88037109375, -13.376953125, -12.87353515625, -12.3701171875, -11.86669921875, -11.36328125, -10.85986328125, -10.3564453125, -9.85302734375, -9.349609375, -8.84619140625, -8.3427734375, -7.83935546875, -7.3359375, -6.83251953125, -6.3291015625, -5.82568359375, -5.322265625, -4.81884765625, -4.3154296875, -3.81201171875, -3.30859375, -2.80517578125, -2.3017578125, -1.79833984375, -1.294921875, -0.79150390625, -0.2880859375, 0.21533203125, 0.71875, 1.22216796875, 1.7255859375, 2.22900390625, 2.732421875, 3.23583984375, 3.7392578125, 4.24267578125, 4.74609375, 5.24951171875, 5.7529296875, 6.25634765625, 6.759765625, 7.26318359375, 7.7666015625, 8.27001953125, 8.7734375, 9.27685546875, 9.7802734375, 10.28369140625, 10.787109375, 11.29052734375, 11.7939453125, 12.29736328125, 12.80078125, 13.30419921875, 13.8076171875, 14.31103515625, 14.814453125, 15.31787109375, 15.8212890625, 16.32470703125, 16.828125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 2.0, 11.0, 15.0, 21.0, 24.0, 30.0, 53.0, 69.0, 96.0, 154.0, 235.0, 403.0, 649.0, 1281.0, 2741.0, 6780.0, 23079.0, 138415.0, 2260006.0, 1618290.0, 110718.0, 20048.0, 5971.0, 2341.0, 1132.0, 637.0, 370.0, 214.0, 128.0, 112.0, 69.0, 60.0, 33.0, 29.0, 17.0, 10.0, 7.0, 17.0, 5.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-24.453125, -23.7109375, -22.96875, -22.2265625, -21.484375, -20.7421875, -20.0, -19.2578125, -18.515625, -17.7734375, -17.03125, -16.2890625, -15.546875, -14.8046875, -14.0625, -13.3203125, -12.578125, -11.8359375, -11.09375, -10.3515625, -9.609375, -8.8671875, -8.125, -7.3828125, -6.640625, -5.8984375, -5.15625, -4.4140625, -3.671875, -2.9296875, -2.1875, -1.4453125, -0.703125, 0.0390625, 0.78125, 1.5234375, 2.265625, 3.0078125, 3.75, 4.4921875, 5.234375, 5.9765625, 6.71875, 7.4609375, 8.203125, 8.9453125, 9.6875, 10.4296875, 11.171875, 11.9140625, 12.65625, 13.3984375, 14.140625, 14.8828125, 15.625, 16.3671875, 17.109375, 17.8515625, 18.59375, 19.3359375, 20.078125, 20.8203125, 21.5625, 22.3046875, 23.046875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 6.0, 301.0, 661.0, 45.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-593.8287353515625, -578.2841186523438, -562.739501953125, -547.1948852539062, -531.6502685546875, -516.1056518554688, -500.5610046386719, -485.0163879394531, -469.4717712402344, -453.9271545410156, -438.3825378417969, -422.8379211425781, -407.29327392578125, -391.7486572265625, -376.20404052734375, -360.659423828125, -345.11480712890625, -329.5701904296875, -314.02557373046875, -298.48095703125, -282.93634033203125, -267.3917236328125, -251.84707641601562, -236.30245971679688, -220.75784301757812, -205.21322631835938, -189.66860961914062, -174.1239776611328, -158.57936096191406, -143.0347442626953, -127.49011993408203, -111.94549560546875, -96.40090942382812, -80.85629272460938, -65.3116683959961, -49.76704788208008, -34.22242736816406, -18.677810668945312, -3.1331863403320312, 12.41143798828125, 27.9560546875, 43.500675201416016, 59.04529571533203, 74.58992004394531, 90.13453674316406, 105.67915344238281, 121.2237777709961, 136.76840209960938, 152.31301879882812, 167.85763549804688, 183.40225219726562, 198.94688415527344, 214.4915008544922, 230.03611755371094, 245.58074951171875, 261.1253662109375, 276.66998291015625, 292.214599609375, 307.75921630859375, 323.3038330078125, 338.84844970703125, 354.39306640625, 369.9377136230469, 385.4823303222656, 401.0269470214844]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 7.0, 8.0, 10.0, 12.0, 17.0, 14.0, 13.0, 28.0, 23.0, 32.0, 37.0, 29.0, 29.0, 39.0, 34.0, 48.0, 44.0, 49.0, 43.0, 35.0, 48.0, 43.0, 36.0, 42.0, 37.0, 32.0, 36.0, 26.0, 29.0, 16.0, 14.0, 22.0, 14.0, 12.0, 8.0, 10.0, 6.0, 6.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.862548828125, -36.55066680908203, -35.2387809753418, -33.92689514160156, -32.615013122558594, -31.303129196166992, -29.99124526977539, -28.67936134338379, -27.367477416992188, -26.055593490600586, -24.743709564208984, -23.431825637817383, -22.11994171142578, -20.80805778503418, -19.496173858642578, -18.184289932250977, -16.872406005859375, -15.560522079467773, -14.248638153076172, -12.93675422668457, -11.624870300292969, -10.312986373901367, -9.001102447509766, -7.689218521118164, -6.3773345947265625, -5.065450668334961, -3.7535667419433594, -2.441682815551758, -1.1297988891601562, 0.1820850372314453, 1.4939689636230469, 2.8058528900146484, 4.11773681640625, 5.429620742797852, 6.741504669189453, 8.053388595581055, 9.365272521972656, 10.677156448364258, 11.98904037475586, 13.300924301147461, 14.612808227539062, 15.924692153930664, 17.236576080322266, 18.548460006713867, 19.86034393310547, 21.17222785949707, 22.484111785888672, 23.795995712280273, 25.107879638671875, 26.419763565063477, 27.731647491455078, 29.04353141784668, 30.35541534423828, 31.667299270629883, 32.979183197021484, 34.29106903076172, 35.60295104980469, 36.914833068847656, 38.22671890258789, 39.538604736328125, 40.850486755371094, 42.16236877441406, 43.4742546081543, 44.78614044189453, 46.0980224609375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 4.0, 8.0, 8.0, 6.0, 13.0, 11.0, 24.0, 17.0, 14.0, 28.0, 21.0, 31.0, 35.0, 40.0, 42.0, 37.0, 33.0, 42.0, 45.0, 35.0, 46.0, 38.0, 34.0, 36.0, 30.0, 36.0, 35.0, 39.0, 31.0, 26.0, 18.0, 18.0, 22.0, 17.0, 22.0, 10.0, 9.0, 8.0, 5.0, 4.0, 7.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.4140625, -7.2025146484375, -6.990966796875, -6.7794189453125, -6.56787109375, -6.3563232421875, -6.144775390625, -5.9332275390625, -5.7216796875, -5.5101318359375, -5.298583984375, -5.0870361328125, -4.87548828125, -4.6639404296875, -4.452392578125, -4.2408447265625, -4.029296875, -3.8177490234375, -3.606201171875, -3.3946533203125, -3.18310546875, -2.9715576171875, -2.760009765625, -2.5484619140625, -2.3369140625, -2.1253662109375, -1.913818359375, -1.7022705078125, -1.49072265625, -1.2791748046875, -1.067626953125, -0.8560791015625, -0.64453125, -0.4329833984375, -0.221435546875, -0.0098876953125, 0.20166015625, 0.4132080078125, 0.624755859375, 0.8363037109375, 1.0478515625, 1.2593994140625, 1.470947265625, 1.6824951171875, 1.89404296875, 2.1055908203125, 2.317138671875, 2.5286865234375, 2.740234375, 2.9517822265625, 3.163330078125, 3.3748779296875, 3.58642578125, 3.7979736328125, 4.009521484375, 4.2210693359375, 4.4326171875, 4.6441650390625, 4.855712890625, 5.0672607421875, 5.27880859375, 5.4903564453125, 5.701904296875, 5.9134521484375, 6.125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 13.0, 27.0, 27.0, 37.0, 71.0, 109.0, 142.0, 217.0, 365.0, 527.0, 810.0, 1306.0, 2006.0, 3308.0, 5093.0, 8110.0, 13169.0, 21503.0, 36406.0, 64005.0, 124215.0, 353014.0, 200992.0, 89754.0, 49316.0, 28472.0, 17134.0, 10459.0, 6498.0, 4251.0, 2554.0, 1612.0, 1070.0, 693.0, 447.0, 278.0, 194.0, 110.0, 65.0, 55.0, 41.0, 24.0, 15.0, 14.0, 9.0, 9.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.7685546875, -0.7457962036132812, -0.7230377197265625, -0.7002792358398438, -0.677520751953125, -0.6547622680664062, -0.6320037841796875, -0.6092453002929688, -0.58648681640625, -0.5637283325195312, -0.5409698486328125, -0.5182113647460938, -0.495452880859375, -0.47269439697265625, -0.4499359130859375, -0.42717742919921875, -0.4044189453125, -0.38166046142578125, -0.3589019775390625, -0.33614349365234375, -0.313385009765625, -0.29062652587890625, -0.2678680419921875, -0.24510955810546875, -0.22235107421875, -0.19959259033203125, -0.1768341064453125, -0.15407562255859375, -0.131317138671875, -0.10855865478515625, -0.0858001708984375, -0.06304168701171875, -0.040283203125, -0.01752471923828125, 0.0052337646484375, 0.02799224853515625, 0.050750732421875, 0.07350921630859375, 0.0962677001953125, 0.11902618408203125, 0.14178466796875, 0.16454315185546875, 0.1873016357421875, 0.21006011962890625, 0.232818603515625, 0.25557708740234375, 0.2783355712890625, 0.30109405517578125, 0.3238525390625, 0.34661102294921875, 0.3693695068359375, 0.39212799072265625, 0.414886474609375, 0.43764495849609375, 0.4604034423828125, 0.48316192626953125, 0.50592041015625, 0.5286788940429688, 0.5514373779296875, 0.5741958618164062, 0.596954345703125, 0.6197128295898438, 0.6424713134765625, 0.6652297973632812, 0.68798828125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 4.0, 12.0, 12.0, 10.0, 14.0, 14.0, 26.0, 25.0, 21.0, 24.0, 35.0, 39.0, 35.0, 36.0, 43.0, 50.0, 44.0, 52.0, 1065.0, 42.0, 41.0, 40.0, 41.0, 42.0, 31.0, 35.0, 23.0, 22.0, 28.0, 22.0, 17.0, 12.0, 19.0, 12.0, 9.0, 4.0, 6.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.7957763671875, -4.607177734375, -4.4185791015625, -4.22998046875, -4.0413818359375, -3.852783203125, -3.6641845703125, -3.4755859375, -3.2869873046875, -3.098388671875, -2.9097900390625, -2.72119140625, -2.5325927734375, -2.343994140625, -2.1553955078125, -1.966796875, -1.7781982421875, -1.589599609375, -1.4010009765625, -1.21240234375, -1.0238037109375, -0.835205078125, -0.6466064453125, -0.4580078125, -0.2694091796875, -0.080810546875, 0.1077880859375, 0.29638671875, 0.4849853515625, 0.673583984375, 0.8621826171875, 1.05078125, 1.2393798828125, 1.427978515625, 1.6165771484375, 1.80517578125, 1.9937744140625, 2.182373046875, 2.3709716796875, 2.5595703125, 2.7481689453125, 2.936767578125, 3.1253662109375, 3.31396484375, 3.5025634765625, 3.691162109375, 3.8797607421875, 4.068359375, 4.2569580078125, 4.445556640625, 4.6341552734375, 4.82275390625, 5.0113525390625, 5.199951171875, 5.3885498046875, 5.5771484375, 5.7657470703125, 5.954345703125, 6.1429443359375, 6.33154296875, 6.5201416015625, 6.708740234375, 6.8973388671875, 7.0859375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 10.0, 13.0, 11.0, 17.0, 38.0, 57.0, 78.0, 125.0, 219.0, 332.0, 513.0, 874.0, 1453.0, 2303.0, 3857.0, 6682.0, 11116.0, 20028.0, 36821.0, 72995.0, 168816.0, 1474047.0, 150693.0, 66908.0, 34241.0, 18615.0, 10735.0, 6124.0, 3719.0, 2191.0, 1324.0, 838.0, 529.0, 309.0, 185.0, 105.0, 68.0, 60.0, 32.0, 23.0, 13.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.47705078125, -0.4631996154785156, -0.44934844970703125, -0.4354972839355469, -0.4216461181640625, -0.4077949523925781, -0.39394378662109375, -0.3800926208496094, -0.366241455078125, -0.3523902893066406, -0.33853912353515625, -0.3246879577636719, -0.3108367919921875, -0.2969856262207031, -0.28313446044921875, -0.2692832946777344, -0.25543212890625, -0.24158096313476562, -0.22772979736328125, -0.21387863159179688, -0.2000274658203125, -0.18617630004882812, -0.17232513427734375, -0.15847396850585938, -0.144622802734375, -0.13077163696289062, -0.11692047119140625, -0.10306930541992188, -0.0892181396484375, -0.07536697387695312, -0.06151580810546875, -0.047664642333984375, -0.0338134765625, -0.019962310791015625, -0.00611114501953125, 0.007740020751953125, 0.0215911865234375, 0.035442352294921875, 0.04929351806640625, 0.06314468383789062, 0.076995849609375, 0.09084701538085938, 0.10469818115234375, 0.11854934692382812, 0.1324005126953125, 0.14625167846679688, 0.16010284423828125, 0.17395401000976562, 0.18780517578125, 0.20165634155273438, 0.21550750732421875, 0.22935867309570312, 0.2432098388671875, 0.2570610046386719, 0.27091217041015625, 0.2847633361816406, 0.298614501953125, 0.3124656677246094, 0.32631683349609375, 0.3401679992675781, 0.3540191650390625, 0.3678703308105469, 0.38172149658203125, 0.3955726623535156, 0.409423828125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 9.0, 7.0, 8.0, 3.0, 13.0, 12.0, 11.0, 20.0, 22.0, 20.0, 31.0, 47.0, 59.0, 96.0, 222.0, 108.0, 71.0, 54.0, 29.0, 24.0, 13.0, 23.0, 12.0, 9.0, 14.0, 15.0, 8.0, 8.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.519390106201172e-05, -5.3503550589084625e-05, -5.181320011615753e-05, -5.012284964323044e-05, -4.8432499170303345e-05, -4.674214869737625e-05, -4.505179822444916e-05, -4.3361447751522064e-05, -4.167109727859497e-05, -3.998074680566788e-05, -3.8290396332740784e-05, -3.660004585981369e-05, -3.49096953868866e-05, -3.32193449139595e-05, -3.152899444103241e-05, -2.9838643968105316e-05, -2.8148293495178223e-05, -2.645794302225113e-05, -2.4767592549324036e-05, -2.3077242076396942e-05, -2.138689160346985e-05, -1.9696541130542755e-05, -1.800619065761566e-05, -1.6315840184688568e-05, -1.4625489711761475e-05, -1.2935139238834381e-05, -1.1244788765907288e-05, -9.554438292980194e-06, -7.8640878200531e-06, -6.173737347126007e-06, -4.4833868741989136e-06, -2.79303640127182e-06, -1.1026859283447266e-06, 5.876645445823669e-07, 2.2780150175094604e-06, 3.968365490436554e-06, 5.6587159633636475e-06, 7.349066436290741e-06, 9.039416909217834e-06, 1.0729767382144928e-05, 1.2420117855072021e-05, 1.4110468327999115e-05, 1.580081880092621e-05, 1.7491169273853302e-05, 1.9181519746780396e-05, 2.087187021970749e-05, 2.2562220692634583e-05, 2.4252571165561676e-05, 2.594292163848877e-05, 2.7633272111415863e-05, 2.9323622584342957e-05, 3.101397305727005e-05, 3.2704323530197144e-05, 3.439467400312424e-05, 3.608502447605133e-05, 3.7775374948978424e-05, 3.946572542190552e-05, 4.115607589483261e-05, 4.2846426367759705e-05, 4.45367768406868e-05, 4.622712731361389e-05, 4.7917477786540985e-05, 4.960782825946808e-05, 5.129817873239517e-05, 5.2988529205322266e-05]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 13.0, 10.0, 19.0, 29.0, 18.0, 27.0, 42.0, 47.0, 75.0, 101.0, 175.0, 426.0, 2911.0, 287986.0, 751136.0, 4377.0, 501.0, 207.0, 113.0, 75.0, 55.0, 38.0, 30.0, 17.0, 24.0, 15.0, 13.0, 11.0, 8.0, 7.0, 7.0, 8.0, 2.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009121894836425781, -0.0008828267455101013, -0.0008534640073776245, -0.0008241012692451477, -0.0007947385311126709, -0.0007653757929801941, -0.0007360130548477173, -0.0007066503167152405, -0.0006772875785827637, -0.0006479248404502869, -0.0006185621023178101, -0.0005891993641853333, -0.0005598366260528564, -0.0005304738879203796, -0.0005011111497879028, -0.000471748411655426, -0.0004423856735229492, -0.0004130229353904724, -0.0003836601972579956, -0.0003542974591255188, -0.000324934720993042, -0.0002955719828605652, -0.0002662092447280884, -0.00023684650659561157, -0.00020748376846313477, -0.00017812103033065796, -0.00014875829219818115, -0.00011939555406570435, -9.003281593322754e-05, -6.067007780075073e-05, -3.1307339668273926e-05, -1.944601535797119e-06, 2.7418136596679688e-05, 5.6780874729156494e-05, 8.61436128616333e-05, 0.00011550635099411011, 0.00014486908912658691, 0.00017423182725906372, 0.00020359456539154053, 0.00023295730352401733, 0.00026232004165649414, 0.00029168277978897095, 0.00032104551792144775, 0.00035040825605392456, 0.00037977099418640137, 0.0004091337323188782, 0.000438496470451355, 0.0004678592085838318, 0.0004972219467163086, 0.0005265846848487854, 0.0005559474229812622, 0.000585310161113739, 0.0006146728992462158, 0.0006440356373786926, 0.0006733983755111694, 0.0007027611136436462, 0.000732123851776123, 0.0007614865899085999, 0.0007908493280410767, 0.0008202120661735535, 0.0008495748043060303, 0.0008789375424385071, 0.0009083002805709839, 0.0009376630187034607, 0.0009670257568359375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 19.0, 44.0, 107.0, 160.0, 251.0, 195.0, 123.0, 69.0, 21.0, 14.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010924146772595122, -0.00010700400162022561, -0.00010476653551449999, -0.00010252907668473199, -0.00010029161057900637, -9.805414447328076e-05, -9.581667836755514e-05, -9.357921226182953e-05, -9.134174615610391e-05, -8.910428005037829e-05, -8.686681394465268e-05, -8.462935511488467e-05, -8.239188900915906e-05, -8.015442290343344e-05, -7.791695679770783e-05, -7.567949069198221e-05, -7.344203186221421e-05, -7.120456575648859e-05, -6.896709965076298e-05, -6.672964082099497e-05, -6.449217471526936e-05, -6.225470860954374e-05, -6.0017242503818125e-05, -5.777977639809251e-05, -5.55423139303457e-05, -5.330484782462008e-05, -5.1067385356873274e-05, -4.882991925114766e-05, -4.659245314542204e-05, -4.435499067767523e-05, -4.2117524571949616e-05, -3.988006210420281e-05, -3.764259599847719e-05, -3.5405129892751575e-05, -3.3167667425004765e-05, -3.093020131927915e-05, -2.8692737032542937e-05, -2.6455272745806724e-05, -2.4217806640081108e-05, -2.1980342353344895e-05, -1.9742878066608682e-05, -1.750541377987247e-05, -1.5267949493136257e-05, -1.303048338741064e-05, -1.0793019100674428e-05, -8.555554813938215e-06, -6.318089617707301e-06, -4.0806244214763865e-06, -1.8431601347401738e-06, 3.9430460674338974e-07, 2.6317693482269533e-06, 4.869234089710517e-06, 7.10669883119408e-06, 9.344163117930293e-06, 1.1581628314161208e-05, 1.3819093510392122e-05, 1.6056557797128335e-05, 1.8294022083864547e-05, 2.053148637060076e-05, 2.2768952476326376e-05, 2.500641676306259e-05, 2.72438810497988e-05, 2.9481347155524418e-05, 3.171880962327123e-05, 3.395627572899684e-05]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 5.0, 7.0, 10.0, 10.0, 10.0, 14.0, 13.0, 19.0, 23.0, 16.0, 24.0, 31.0, 20.0, 25.0, 32.0, 36.0, 33.0, 30.0, 40.0, 40.0, 37.0, 36.0, 40.0, 31.0, 35.0, 33.0, 33.0, 31.0, 27.0, 36.0, 26.0, 25.0, 30.0, 17.0, 16.0, 10.0, 16.0, 4.0, 12.0, 10.0, 14.0, 8.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.092123031616211e-05, -2.0248815417289734e-05, -1.957640051841736e-05, -1.8903985619544983e-05, -1.8231570720672607e-05, -1.7559155821800232e-05, -1.6886740922927856e-05, -1.621432602405548e-05, -1.5541911125183105e-05, -1.486949622631073e-05, -1.4197081327438354e-05, -1.3524666428565979e-05, -1.2852251529693604e-05, -1.2179836630821228e-05, -1.1507421731948853e-05, -1.0835006833076477e-05, -1.0162591934204102e-05, -9.490177035331726e-06, -8.81776213645935e-06, -8.145347237586975e-06, -7.4729323387146e-06, -6.800517439842224e-06, -6.128102540969849e-06, -5.455687642097473e-06, -4.783272743225098e-06, -4.110857844352722e-06, -3.4384429454803467e-06, -2.766028046607971e-06, -2.0936131477355957e-06, -1.4211982488632202e-06, -7.487833499908447e-07, -7.636845111846924e-08, 5.960464477539062e-07, 1.2684613466262817e-06, 1.9408762454986572e-06, 2.6132911443710327e-06, 3.285706043243408e-06, 3.958120942115784e-06, 4.630535840988159e-06, 5.302950739860535e-06, 5.97536563873291e-06, 6.647780537605286e-06, 7.320195436477661e-06, 7.992610335350037e-06, 8.665025234222412e-06, 9.337440133094788e-06, 1.0009855031967163e-05, 1.0682269930839539e-05, 1.1354684829711914e-05, 1.202709972858429e-05, 1.2699514627456665e-05, 1.337192952632904e-05, 1.4044344425201416e-05, 1.4716759324073792e-05, 1.5389174222946167e-05, 1.6061589121818542e-05, 1.6734004020690918e-05, 1.7406418919563293e-05, 1.807883381843567e-05, 1.8751248717308044e-05, 1.942366361618042e-05, 2.0096078515052795e-05, 2.076849341392517e-05, 2.1440908312797546e-05, 2.2113323211669922e-05]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 4.0, 8.0, 8.0, 6.0, 13.0, 11.0, 24.0, 17.0, 14.0, 28.0, 21.0, 31.0, 35.0, 40.0, 42.0, 37.0, 33.0, 42.0, 45.0, 35.0, 46.0, 38.0, 34.0, 36.0, 30.0, 36.0, 35.0, 39.0, 31.0, 26.0, 18.0, 18.0, 22.0, 17.0, 22.0, 10.0, 9.0, 8.0, 5.0, 4.0, 7.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.4140625, -7.2025146484375, -6.990966796875, -6.7794189453125, -6.56787109375, -6.3563232421875, -6.144775390625, -5.9332275390625, -5.7216796875, -5.5101318359375, -5.298583984375, -5.0870361328125, -4.87548828125, -4.6639404296875, -4.452392578125, -4.2408447265625, -4.029296875, -3.8177490234375, -3.606201171875, -3.3946533203125, -3.18310546875, -2.9715576171875, -2.760009765625, -2.5484619140625, -2.3369140625, -2.1253662109375, -1.913818359375, -1.7022705078125, -1.49072265625, -1.2791748046875, -1.067626953125, -0.8560791015625, -0.64453125, -0.4329833984375, -0.221435546875, -0.0098876953125, 0.20166015625, 0.4132080078125, 0.624755859375, 0.8363037109375, 1.0478515625, 1.2593994140625, 1.470947265625, 1.6824951171875, 1.89404296875, 2.1055908203125, 2.317138671875, 2.5286865234375, 2.740234375, 2.9517822265625, 3.163330078125, 3.3748779296875, 3.58642578125, 3.7979736328125, 4.009521484375, 4.2210693359375, 4.4326171875, 4.6441650390625, 4.855712890625, 5.0672607421875, 5.27880859375, 5.4903564453125, 5.701904296875, 5.9134521484375, 6.125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 8.0, 6.0, 7.0, 15.0, 20.0, 21.0, 29.0, 42.0, 50.0, 76.0, 117.0, 155.0, 265.0, 448.0, 716.0, 1246.0, 2358.0, 4489.0, 9476.0, 21434.0, 53496.0, 151900.0, 402135.0, 253893.0, 86096.0, 32653.0, 13939.0, 6253.0, 3133.0, 1671.0, 927.0, 498.0, 309.0, 208.0, 151.0, 67.0, 65.0, 55.0, 35.0, 23.0, 19.0, 21.0, 7.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.53125, -10.1885986328125, -9.845947265625, -9.5032958984375, -9.16064453125, -8.8179931640625, -8.475341796875, -8.1326904296875, -7.7900390625, -7.4473876953125, -7.104736328125, -6.7620849609375, -6.41943359375, -6.0767822265625, -5.734130859375, -5.3914794921875, -5.048828125, -4.7061767578125, -4.363525390625, -4.0208740234375, -3.67822265625, -3.3355712890625, -2.992919921875, -2.6502685546875, -2.3076171875, -1.9649658203125, -1.622314453125, -1.2796630859375, -0.93701171875, -0.5943603515625, -0.251708984375, 0.0909423828125, 0.43359375, 0.7762451171875, 1.118896484375, 1.4615478515625, 1.80419921875, 2.1468505859375, 2.489501953125, 2.8321533203125, 3.1748046875, 3.5174560546875, 3.860107421875, 4.2027587890625, 4.54541015625, 4.8880615234375, 5.230712890625, 5.5733642578125, 5.916015625, 6.2586669921875, 6.601318359375, 6.9439697265625, 7.28662109375, 7.6292724609375, 7.971923828125, 8.3145751953125, 8.6572265625, 8.9998779296875, 9.342529296875, 9.6851806640625, 10.02783203125, 10.3704833984375, 10.713134765625, 11.0557861328125, 11.3984375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 1.0, 9.0, 7.0, 7.0, 12.0, 21.0, 22.0, 15.0, 23.0, 21.0, 35.0, 39.0, 42.0, 26.0, 55.0, 60.0, 94.0, 162.0, 300.0, 1394.0, 174.0, 91.0, 91.0, 58.0, 46.0, 33.0, 37.0, 27.0, 14.0, 23.0, 16.0, 24.0, 13.0, 9.0, 10.0, 8.0, 8.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-16.328125, -15.8350830078125, -15.342041015625, -14.8489990234375, -14.35595703125, -13.8629150390625, -13.369873046875, -12.8768310546875, -12.3837890625, -11.8907470703125, -11.397705078125, -10.9046630859375, -10.41162109375, -9.9185791015625, -9.425537109375, -8.9324951171875, -8.439453125, -7.9464111328125, -7.453369140625, -6.9603271484375, -6.46728515625, -5.9742431640625, -5.481201171875, -4.9881591796875, -4.4951171875, -4.0020751953125, -3.509033203125, -3.0159912109375, -2.52294921875, -2.0299072265625, -1.536865234375, -1.0438232421875, -0.55078125, -0.0577392578125, 0.435302734375, 0.9283447265625, 1.42138671875, 1.9144287109375, 2.407470703125, 2.9005126953125, 3.3935546875, 3.8865966796875, 4.379638671875, 4.8726806640625, 5.36572265625, 5.8587646484375, 6.351806640625, 6.8448486328125, 7.337890625, 7.8309326171875, 8.323974609375, 8.8170166015625, 9.31005859375, 9.8031005859375, 10.296142578125, 10.7891845703125, 11.2822265625, 11.7752685546875, 12.268310546875, 12.7613525390625, 13.25439453125, 13.7474365234375, 14.240478515625, 14.7335205078125, 15.2265625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 8.0, 10.0, 13.0, 16.0, 22.0, 18.0, 34.0, 34.0, 59.0, 64.0, 110.0, 233.0, 338.0, 697.0, 2434.0, 50406.0, 3055459.0, 32082.0, 2041.0, 652.0, 362.0, 179.0, 110.0, 102.0, 61.0, 32.0, 29.0, 25.0, 13.0, 14.0, 9.0, 12.0, 4.0, 6.0, 4.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-47.4375, -46.060546875, -44.68359375, -43.306640625, -41.9296875, -40.552734375, -39.17578125, -37.798828125, -36.421875, -35.044921875, -33.66796875, -32.291015625, -30.9140625, -29.537109375, -28.16015625, -26.783203125, -25.40625, -24.029296875, -22.65234375, -21.275390625, -19.8984375, -18.521484375, -17.14453125, -15.767578125, -14.390625, -13.013671875, -11.63671875, -10.259765625, -8.8828125, -7.505859375, -6.12890625, -4.751953125, -3.375, -1.998046875, -0.62109375, 0.755859375, 2.1328125, 3.509765625, 4.88671875, 6.263671875, 7.640625, 9.017578125, 10.39453125, 11.771484375, 13.1484375, 14.525390625, 15.90234375, 17.279296875, 18.65625, 20.033203125, 21.41015625, 22.787109375, 24.1640625, 25.541015625, 26.91796875, 28.294921875, 29.671875, 31.048828125, 32.42578125, 33.802734375, 35.1796875, 36.556640625, 37.93359375, 39.310546875, 40.6875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 68.0, 298.0, 461.0, 153.0, 23.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-188.20106506347656, -181.29483032226562, -174.38861083984375, -167.4823760986328, -160.57614135742188, -153.669921875, -146.76368713378906, -139.85745239257812, -132.95123291015625, -126.04500579833984, -119.1387710571289, -112.2325439453125, -105.32630920410156, -98.42008209228516, -91.51385498046875, -84.60762023925781, -77.70138549804688, -70.79515838623047, -63.88892364501953, -56.982696533203125, -50.07646560668945, -43.17023468017578, -36.264007568359375, -29.357776641845703, -22.45154571533203, -15.545315742492676, -8.63908576965332, -1.7328567504882812, 5.173374176025391, 12.079605102539062, 18.98583221435547, 25.89206314086914, 32.79829406738281, 39.704524993896484, 46.610755920410156, 53.51698303222656, 60.423213958740234, 67.3294448852539, 74.23567199707031, 81.14190673828125, 88.04813385009766, 94.95436096191406, 101.860595703125, 108.7668228149414, 115.67304992675781, 122.57928466796875, 129.48550415039062, 136.39173889160156, 143.2979736328125, 150.20420837402344, 157.1104278564453, 164.01666259765625, 170.9228973388672, 177.82913208007812, 184.7353515625, 191.64158630371094, 198.54782104492188, 205.4540557861328, 212.3602752685547, 219.26651000976562, 226.17274475097656, 233.0789794921875, 239.98519897460938, 246.8914337158203, 253.7976531982422]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 11.0, 4.0, 4.0, 5.0, 8.0, 9.0, 8.0, 16.0, 17.0, 26.0, 17.0, 28.0, 31.0, 33.0, 34.0, 34.0, 37.0, 33.0, 40.0, 37.0, 43.0, 45.0, 42.0, 38.0, 36.0, 40.0, 33.0, 32.0, 28.0, 32.0, 26.0, 41.0, 24.0, 24.0, 13.0, 19.0, 10.0, 10.0, 6.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.89122009277344, -44.104270935058594, -42.31732177734375, -40.530372619628906, -38.74342346191406, -36.95647430419922, -35.16952896118164, -33.3825798034668, -31.595630645751953, -29.80868148803711, -28.021732330322266, -26.234785079956055, -24.44783592224121, -22.660886764526367, -20.873939514160156, -19.086990356445312, -17.30004119873047, -15.513092041015625, -13.726143836975098, -11.93919563293457, -10.152246475219727, -8.365297317504883, -6.5783491134643555, -4.791400909423828, -3.0044517517089844, -1.2175030708312988, 0.5694456100463867, 2.3563942909240723, 4.143342971801758, 5.930292129516602, 7.717240333557129, 9.504188537597656, 11.2911376953125, 13.078086853027344, 14.865035057067871, 16.6519832611084, 18.438932418823242, 20.225881576538086, 22.012828826904297, 23.79977798461914, 25.586727142333984, 27.373676300048828, 29.160625457763672, 30.947572708129883, 32.734519958496094, 34.52146911621094, 36.30841827392578, 38.095367431640625, 39.88231658935547, 41.66926574707031, 43.456214904785156, 45.2431640625, 47.030113220214844, 48.81706237792969, 50.604007720947266, 52.39095687866211, 54.17790603637695, 55.9648551940918, 57.75180435180664, 59.538753509521484, 61.32569885253906, 63.112648010253906, 64.89959716796875, 66.6865463256836, 68.47349548339844]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 10.0, 5.0, 9.0, 7.0, 9.0, 17.0, 21.0, 22.0, 35.0, 39.0, 27.0, 39.0, 31.0, 41.0, 40.0, 50.0, 56.0, 43.0, 31.0, 45.0, 41.0, 41.0, 34.0, 39.0, 29.0, 42.0, 39.0, 21.0, 25.0, 17.0, 16.0, 17.0, 13.0, 14.0, 9.0, 10.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.15625, -7.9105224609375, -7.664794921875, -7.4190673828125, -7.17333984375, -6.9276123046875, -6.681884765625, -6.4361572265625, -6.1904296875, -5.9447021484375, -5.698974609375, -5.4532470703125, -5.20751953125, -4.9617919921875, -4.716064453125, -4.4703369140625, -4.224609375, -3.9788818359375, -3.733154296875, -3.4874267578125, -3.24169921875, -2.9959716796875, -2.750244140625, -2.5045166015625, -2.2587890625, -2.0130615234375, -1.767333984375, -1.5216064453125, -1.27587890625, -1.0301513671875, -0.784423828125, -0.5386962890625, -0.29296875, -0.0472412109375, 0.198486328125, 0.4442138671875, 0.68994140625, 0.9356689453125, 1.181396484375, 1.4271240234375, 1.6728515625, 1.9185791015625, 2.164306640625, 2.4100341796875, 2.65576171875, 2.9014892578125, 3.147216796875, 3.3929443359375, 3.638671875, 3.8843994140625, 4.130126953125, 4.3758544921875, 4.62158203125, 4.8673095703125, 5.113037109375, 5.3587646484375, 5.6044921875, 5.8502197265625, 6.095947265625, 6.3416748046875, 6.58740234375, 6.8331298828125, 7.078857421875, 7.3245849609375, 7.5703125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 10.0, 11.0, 8.0, 17.0, 28.0, 31.0, 42.0, 59.0, 79.0, 143.0, 211.0, 334.0, 467.0, 713.0, 1177.0, 2083.0, 3803.0, 6774.0, 13500.0, 30105.0, 104381.0, 738181.0, 2504754.0, 638347.0, 92416.0, 28549.0, 12554.0, 6646.0, 3573.0, 1964.0, 1198.0, 736.0, 453.0, 317.0, 199.0, 123.0, 84.0, 46.0, 47.0, 33.0, 21.0, 17.0, 8.0, 14.0, 5.0, 3.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-15.453125, -14.9913330078125, -14.529541015625, -14.0677490234375, -13.60595703125, -13.1441650390625, -12.682373046875, -12.2205810546875, -11.7587890625, -11.2969970703125, -10.835205078125, -10.3734130859375, -9.91162109375, -9.4498291015625, -8.988037109375, -8.5262451171875, -8.064453125, -7.6026611328125, -7.140869140625, -6.6790771484375, -6.21728515625, -5.7554931640625, -5.293701171875, -4.8319091796875, -4.3701171875, -3.9083251953125, -3.446533203125, -2.9847412109375, -2.52294921875, -2.0611572265625, -1.599365234375, -1.1375732421875, -0.67578125, -0.2139892578125, 0.247802734375, 0.7095947265625, 1.17138671875, 1.6331787109375, 2.094970703125, 2.5567626953125, 3.0185546875, 3.4803466796875, 3.942138671875, 4.4039306640625, 4.86572265625, 5.3275146484375, 5.789306640625, 6.2510986328125, 6.712890625, 7.1746826171875, 7.636474609375, 8.0982666015625, 8.56005859375, 9.0218505859375, 9.483642578125, 9.9454345703125, 10.4072265625, 10.8690185546875, 11.330810546875, 11.7926025390625, 12.25439453125, 12.7161865234375, 13.177978515625, 13.6397705078125, 14.1015625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 4.0, 12.0, 9.0, 17.0, 32.0, 37.0, 59.0, 102.0, 116.0, 198.0, 340.0, 601.0, 795.0, 612.0, 360.0, 252.0, 165.0, 109.0, 70.0, 44.0, 36.0, 21.0, 20.0, 10.0, 9.0, 7.0, 5.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-19.125, -18.6644287109375, -18.203857421875, -17.7432861328125, -17.28271484375, -16.8221435546875, -16.361572265625, -15.9010009765625, -15.4404296875, -14.9798583984375, -14.519287109375, -14.0587158203125, -13.59814453125, -13.1375732421875, -12.677001953125, -12.2164306640625, -11.755859375, -11.2952880859375, -10.834716796875, -10.3741455078125, -9.91357421875, -9.4530029296875, -8.992431640625, -8.5318603515625, -8.0712890625, -7.6107177734375, -7.150146484375, -6.6895751953125, -6.22900390625, -5.7684326171875, -5.307861328125, -4.8472900390625, -4.38671875, -3.9261474609375, -3.465576171875, -3.0050048828125, -2.54443359375, -2.0838623046875, -1.623291015625, -1.1627197265625, -0.7021484375, -0.2415771484375, 0.218994140625, 0.6795654296875, 1.14013671875, 1.6007080078125, 2.061279296875, 2.5218505859375, 2.982421875, 3.4429931640625, 3.903564453125, 4.3641357421875, 4.82470703125, 5.2852783203125, 5.745849609375, 6.2064208984375, 6.6669921875, 7.1275634765625, 7.588134765625, 8.0487060546875, 8.50927734375, 8.9698486328125, 9.430419921875, 9.8909912109375, 10.3515625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 11.0, 7.0, 9.0, 20.0, 24.0, 27.0, 51.0, 98.0, 196.0, 362.0, 862.0, 2581.0, 9427.0, 61917.0, 2524054.0, 1532893.0, 49763.0, 8197.0, 2268.0, 798.0, 324.0, 171.0, 105.0, 41.0, 18.0, 20.0, 10.0, 12.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.984375, -21.887451171875, -20.79052734375, -19.693603515625, -18.5966796875, -17.499755859375, -16.40283203125, -15.305908203125, -14.208984375, -13.112060546875, -12.01513671875, -10.918212890625, -9.8212890625, -8.724365234375, -7.62744140625, -6.530517578125, -5.43359375, -4.336669921875, -3.23974609375, -2.142822265625, -1.0458984375, 0.051025390625, 1.14794921875, 2.244873046875, 3.341796875, 4.438720703125, 5.53564453125, 6.632568359375, 7.7294921875, 8.826416015625, 9.92333984375, 11.020263671875, 12.1171875, 13.214111328125, 14.31103515625, 15.407958984375, 16.5048828125, 17.601806640625, 18.69873046875, 19.795654296875, 20.892578125, 21.989501953125, 23.08642578125, 24.183349609375, 25.2802734375, 26.377197265625, 27.47412109375, 28.571044921875, 29.66796875, 30.764892578125, 31.86181640625, 32.958740234375, 34.0556640625, 35.152587890625, 36.24951171875, 37.346435546875, 38.443359375, 39.540283203125, 40.63720703125, 41.734130859375, 42.8310546875, 43.927978515625, 45.02490234375, 46.121826171875, 47.21875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 21.0, 168.0, 535.0, 245.0, 41.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-530.4069213867188, -519.2615356445312, -508.1162109375, -496.9708251953125, -485.8254699707031, -474.68011474609375, -463.5347595214844, -452.389404296875, -441.2440185546875, -430.0986633300781, -418.95330810546875, -407.80792236328125, -396.6625671386719, -385.5172119140625, -374.3718566894531, -363.22650146484375, -352.0811462402344, -340.935791015625, -329.7904357910156, -318.64508056640625, -307.49969482421875, -296.3543395996094, -285.208984375, -274.0636291503906, -262.91827392578125, -251.77291870117188, -240.62754821777344, -229.48219299316406, -218.33682250976562, -207.19146728515625, -196.04611206054688, -184.9007568359375, -173.75538635253906, -162.6100311279297, -151.46466064453125, -140.31930541992188, -129.1739501953125, -118.02857971191406, -106.88322448730469, -95.73786163330078, -84.59249877929688, -73.44713592529297, -62.30177688598633, -51.15641784667969, -40.01105499267578, -28.865692138671875, -17.7203369140625, -6.574974060058594, 4.5703887939453125, 15.715749740600586, 26.86111068725586, 38.0064697265625, 49.151832580566406, 60.29719543457031, 71.44255065917969, 82.5879135131836, 93.7332763671875, 104.8786392211914, 116.02400207519531, 127.16935729980469, 138.31472778320312, 149.4600830078125, 160.60543823242188, 171.75079345703125, 182.8961639404297]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 2.0, 6.0, 7.0, 7.0, 8.0, 14.0, 11.0, 12.0, 17.0, 17.0, 18.0, 26.0, 27.0, 30.0, 39.0, 28.0, 33.0, 28.0, 46.0, 41.0, 44.0, 48.0, 38.0, 41.0, 34.0, 26.0, 29.0, 33.0, 47.0, 30.0, 26.0, 33.0, 23.0, 21.0, 15.0, 17.0, 17.0, 6.0, 11.0, 9.0, 13.0, 7.0, 4.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-47.7168083190918, -46.3427848815918, -44.9687614440918, -43.59473419189453, -42.22071075439453, -40.84668731689453, -39.47266387939453, -38.09864044189453, -36.72461700439453, -35.35059356689453, -33.97657012939453, -32.60254669189453, -31.228519439697266, -29.854496002197266, -28.480472564697266, -27.106449127197266, -25.732421875, -24.3583984375, -22.984373092651367, -21.610349655151367, -20.236324310302734, -18.862300872802734, -17.488277435302734, -16.114253997802734, -14.740228652954102, -13.366204261779785, -11.992179870605469, -10.618156433105469, -9.244132041931152, -7.870107650756836, -6.496084213256836, -5.1220598220825195, -3.7480316162109375, -2.3740074634552, -0.9999833106994629, 0.3740406036376953, 1.7480649948120117, 3.122089385986328, 4.496112823486328, 5.8701372146606445, 7.244161605834961, 8.618185997009277, 9.992210388183594, 11.366233825683594, 12.74025821685791, 14.114282608032227, 15.488306045532227, 16.86233139038086, 18.23635482788086, 19.61037826538086, 20.984403610229492, 22.358427047729492, 23.732452392578125, 25.106475830078125, 26.480499267578125, 27.854522705078125, 29.228548049926758, 30.602571487426758, 31.97659683227539, 33.35062026977539, 34.72464370727539, 36.098670959472656, 37.472694396972656, 38.846717834472656, 40.220741271972656]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 12.0, 10.0, 10.0, 12.0, 17.0, 17.0, 34.0, 14.0, 19.0, 24.0, 28.0, 30.0, 32.0, 33.0, 33.0, 38.0, 40.0, 42.0, 55.0, 39.0, 41.0, 27.0, 37.0, 43.0, 28.0, 36.0, 22.0, 33.0, 25.0, 26.0, 22.0, 15.0, 18.0, 13.0, 13.0, 6.0, 5.0, 7.0, 9.0, 6.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0], "bins": [-8.1015625, -7.85565185546875, -7.6097412109375, -7.36383056640625, -7.117919921875, -6.87200927734375, -6.6260986328125, -6.38018798828125, -6.13427734375, -5.88836669921875, -5.6424560546875, -5.39654541015625, -5.150634765625, -4.90472412109375, -4.6588134765625, -4.41290283203125, -4.1669921875, -3.92108154296875, -3.6751708984375, -3.42926025390625, -3.183349609375, -2.93743896484375, -2.6915283203125, -2.44561767578125, -2.19970703125, -1.95379638671875, -1.7078857421875, -1.46197509765625, -1.216064453125, -0.97015380859375, -0.7242431640625, -0.47833251953125, -0.232421875, 0.01348876953125, 0.2593994140625, 0.50531005859375, 0.751220703125, 0.99713134765625, 1.2430419921875, 1.48895263671875, 1.73486328125, 1.98077392578125, 2.2266845703125, 2.47259521484375, 2.718505859375, 2.96441650390625, 3.2103271484375, 3.45623779296875, 3.7021484375, 3.94805908203125, 4.1939697265625, 4.43988037109375, 4.685791015625, 4.93170166015625, 5.1776123046875, 5.42352294921875, 5.66943359375, 5.91534423828125, 6.1612548828125, 6.40716552734375, 6.653076171875, 6.89898681640625, 7.1448974609375, 7.39080810546875, 7.63671875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 4.0, 6.0, 12.0, 17.0, 23.0, 36.0, 49.0, 82.0, 101.0, 141.0, 227.0, 283.0, 425.0, 637.0, 888.0, 1295.0, 1887.0, 2829.0, 4208.0, 6167.0, 9268.0, 14425.0, 22516.0, 35211.0, 58244.0, 101583.0, 256280.0, 268212.0, 103043.0, 58782.0, 35677.0, 22441.0, 14598.0, 9436.0, 6302.0, 4205.0, 2871.0, 1953.0, 1257.0, 925.0, 588.0, 450.0, 293.0, 206.0, 156.0, 103.0, 79.0, 43.0, 41.0, 24.0, 17.0, 5.0, 9.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.7421875, -0.7182540893554688, -0.6943206787109375, -0.6703872680664062, -0.646453857421875, -0.6225204467773438, -0.5985870361328125, -0.5746536254882812, -0.55072021484375, -0.5267868041992188, -0.5028533935546875, -0.47891998291015625, -0.454986572265625, -0.43105316162109375, -0.4071197509765625, -0.38318634033203125, -0.3592529296875, -0.33531951904296875, -0.3113861083984375, -0.28745269775390625, -0.263519287109375, -0.23958587646484375, -0.2156524658203125, -0.19171905517578125, -0.16778564453125, -0.14385223388671875, -0.1199188232421875, -0.09598541259765625, -0.072052001953125, -0.04811859130859375, -0.0241851806640625, -0.00025177001953125, 0.023681640625, 0.04761505126953125, 0.0715484619140625, 0.09548187255859375, 0.119415283203125, 0.14334869384765625, 0.1672821044921875, 0.19121551513671875, 0.21514892578125, 0.23908233642578125, 0.2630157470703125, 0.28694915771484375, 0.310882568359375, 0.33481597900390625, 0.3587493896484375, 0.38268280029296875, 0.4066162109375, 0.43054962158203125, 0.4544830322265625, 0.47841644287109375, 0.502349853515625, 0.5262832641601562, 0.5502166748046875, 0.5741500854492188, 0.59808349609375, 0.6220169067382812, 0.6459503173828125, 0.6698837280273438, 0.693817138671875, 0.7177505493164062, 0.7416839599609375, 0.7656173706054688, 0.78955078125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 7.0, 5.0, 10.0, 8.0, 10.0, 10.0, 22.0, 11.0, 29.0, 19.0, 18.0, 25.0, 22.0, 25.0, 25.0, 42.0, 37.0, 42.0, 42.0, 38.0, 32.0, 1065.0, 36.0, 44.0, 42.0, 33.0, 36.0, 23.0, 30.0, 31.0, 31.0, 24.0, 24.0, 16.0, 11.0, 22.0, 13.0, 21.0, 5.0, 12.0, 8.0, 5.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-8.2421875, -7.998291015625, -7.75439453125, -7.510498046875, -7.2666015625, -7.022705078125, -6.77880859375, -6.534912109375, -6.291015625, -6.047119140625, -5.80322265625, -5.559326171875, -5.3154296875, -5.071533203125, -4.82763671875, -4.583740234375, -4.33984375, -4.095947265625, -3.85205078125, -3.608154296875, -3.3642578125, -3.120361328125, -2.87646484375, -2.632568359375, -2.388671875, -2.144775390625, -1.90087890625, -1.656982421875, -1.4130859375, -1.169189453125, -0.92529296875, -0.681396484375, -0.4375, -0.193603515625, 0.05029296875, 0.294189453125, 0.5380859375, 0.781982421875, 1.02587890625, 1.269775390625, 1.513671875, 1.757568359375, 2.00146484375, 2.245361328125, 2.4892578125, 2.733154296875, 2.97705078125, 3.220947265625, 3.46484375, 3.708740234375, 3.95263671875, 4.196533203125, 4.4404296875, 4.684326171875, 4.92822265625, 5.172119140625, 5.416015625, 5.659912109375, 5.90380859375, 6.147705078125, 6.3916015625, 6.635498046875, 6.87939453125, 7.123291015625, 7.3671875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 5.0, 6.0, 15.0, 12.0, 25.0, 29.0, 42.0, 62.0, 91.0, 133.0, 189.0, 272.0, 415.0, 587.0, 853.0, 1331.0, 1931.0, 2900.0, 4428.0, 6802.0, 10430.0, 16599.0, 26553.0, 44874.0, 80896.0, 174879.0, 1410736.0, 137929.0, 69476.0, 38965.0, 23458.0, 14610.0, 9315.0, 6105.0, 3952.0, 2733.0, 1711.0, 1201.0, 796.0, 566.0, 355.0, 284.0, 180.0, 115.0, 91.0, 67.0, 46.0, 23.0, 15.0, 17.0, 10.0, 11.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49560546875, -0.47928619384765625, -0.4629669189453125, -0.44664764404296875, -0.430328369140625, -0.41400909423828125, -0.3976898193359375, -0.38137054443359375, -0.36505126953125, -0.34873199462890625, -0.3324127197265625, -0.31609344482421875, -0.299774169921875, -0.28345489501953125, -0.2671356201171875, -0.25081634521484375, -0.2344970703125, -0.21817779541015625, -0.2018585205078125, -0.18553924560546875, -0.169219970703125, -0.15290069580078125, -0.1365814208984375, -0.12026214599609375, -0.10394287109375, -0.08762359619140625, -0.0713043212890625, -0.05498504638671875, -0.038665771484375, -0.02234649658203125, -0.0060272216796875, 0.01029205322265625, 0.026611328125, 0.04293060302734375, 0.0592498779296875, 0.07556915283203125, 0.091888427734375, 0.10820770263671875, 0.1245269775390625, 0.14084625244140625, 0.15716552734375, 0.17348480224609375, 0.1898040771484375, 0.20612335205078125, 0.222442626953125, 0.23876190185546875, 0.2550811767578125, 0.27140045166015625, 0.2877197265625, 0.30403900146484375, 0.3203582763671875, 0.33667755126953125, 0.352996826171875, 0.36931610107421875, 0.3856353759765625, 0.40195465087890625, 0.41827392578125, 0.43459320068359375, 0.4509124755859375, 0.46723175048828125, 0.483551025390625, 0.49987030029296875, 0.5161895751953125, 0.5325088500976562, 0.548828125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 6.0, 1.0, 8.0, 7.0, 7.0, 9.0, 11.0, 18.0, 7.0, 17.0, 25.0, 28.0, 26.0, 36.0, 38.0, 53.0, 77.0, 129.0, 107.0, 80.0, 58.0, 52.0, 35.0, 28.0, 22.0, 25.0, 12.0, 17.0, 12.0, 10.0, 5.0, 14.0, 4.0, 13.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.456541061401367e-05, -7.21486285328865e-05, -6.973184645175934e-05, -6.731506437063217e-05, -6.4898282289505e-05, -6.248150020837784e-05, -6.006471812725067e-05, -5.7647936046123505e-05, -5.523115396499634e-05, -5.281437188386917e-05, -5.0397589802742004e-05, -4.798080772161484e-05, -4.556402564048767e-05, -4.3147243559360504e-05, -4.073046147823334e-05, -3.831367939710617e-05, -3.5896897315979004e-05, -3.348011523485184e-05, -3.106333315372467e-05, -2.8646551072597504e-05, -2.6229768991470337e-05, -2.381298691034317e-05, -2.1396204829216003e-05, -1.8979422748088837e-05, -1.656264066696167e-05, -1.4145858585834503e-05, -1.1729076504707336e-05, -9.31229442358017e-06, -6.895512342453003e-06, -4.478730261325836e-06, -2.0619481801986694e-06, 3.548339009284973e-07, 2.771615982055664e-06, 5.188398063182831e-06, 7.6051801443099976e-06, 1.0021962225437164e-05, 1.2438744306564331e-05, 1.4855526387691498e-05, 1.7272308468818665e-05, 1.968909054994583e-05, 2.2105872631072998e-05, 2.4522654712200165e-05, 2.693943679332733e-05, 2.9356218874454498e-05, 3.1773000955581665e-05, 3.418978303670883e-05, 3.6606565117836e-05, 3.9023347198963165e-05, 4.144012928009033e-05, 4.38569113612175e-05, 4.6273693442344666e-05, 4.869047552347183e-05, 5.1107257604599e-05, 5.3524039685726166e-05, 5.594082176685333e-05, 5.83576038479805e-05, 6.0774385929107666e-05, 6.319116801023483e-05, 6.5607950091362e-05, 6.802473217248917e-05, 7.044151425361633e-05, 7.28582963347435e-05, 7.527507841587067e-05, 7.769186049699783e-05, 8.0108642578125e-05]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 7.0, 6.0, 23.0, 17.0, 32.0, 23.0, 27.0, 41.0, 49.0, 72.0, 77.0, 148.0, 186.0, 349.0, 664.0, 2658.0, 55830.0, 950236.0, 34509.0, 2018.0, 558.0, 329.0, 182.0, 128.0, 89.0, 83.0, 49.0, 31.0, 33.0, 27.0, 15.0, 10.0, 11.0, 13.0, 6.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011453628540039062, -0.0011089295148849487, -0.0010724961757659912, -0.0010360628366470337, -0.0009996294975280762, -0.0009631961584091187, -0.0009267628192901611, -0.0008903294801712036, -0.0008538961410522461, -0.0008174628019332886, -0.0007810294628143311, -0.0007445961236953735, -0.000708162784576416, -0.0006717294454574585, -0.000635296106338501, -0.0005988627672195435, -0.0005624294281005859, -0.0005259960889816284, -0.0004895627498626709, -0.0004531294107437134, -0.00041669607162475586, -0.00038026273250579834, -0.0003438293933868408, -0.0003073960542678833, -0.0002709627151489258, -0.00023452937602996826, -0.00019809603691101074, -0.00016166269779205322, -0.0001252293586730957, -8.879601955413818e-05, -5.2362680435180664e-05, -1.5929341316223145e-05, 2.0503997802734375e-05, 5.6937336921691895e-05, 9.337067604064941e-05, 0.00012980401515960693, 0.00016623735427856445, 0.00020267069339752197, 0.0002391040325164795, 0.000275537371635437, 0.00031197071075439453, 0.00034840404987335205, 0.00038483738899230957, 0.0004212707281112671, 0.0004577040672302246, 0.0004941374063491821, 0.0005305707454681396, 0.0005670040845870972, 0.0006034374237060547, 0.0006398707628250122, 0.0006763041019439697, 0.0007127374410629272, 0.0007491707801818848, 0.0007856041193008423, 0.0008220374584197998, 0.0008584707975387573, 0.0008949041366577148, 0.0009313374757766724, 0.0009677708148956299, 0.0010042041540145874, 0.001040637493133545, 0.0010770708322525024, 0.00111350417137146, 0.0011499375104904175, 0.001186370849609375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 16.0, 39.0, 84.0, 201.0, 310.0, 189.0, 92.0, 46.0, 13.0, 8.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.11629953305237e-05, -3.721842949744314e-05, -3.327386366436258e-05, -2.9329294193303213e-05, -2.5384728360222653e-05, -2.1440162527142093e-05, -1.749559487507213e-05, -1.3551027223002166e-05, -9.606461389921606e-06, -5.661894647346344e-06, -1.717327904771082e-06, 2.2272388378041796e-06, 6.171805580379441e-06, 1.0116371413460001e-05, 1.4060939065529965e-05, 1.800550671759993e-05, 2.195007255068049e-05, 2.589463838376105e-05, 2.9839206035831012e-05, 3.3783773687900975e-05, 3.7728339520981535e-05, 4.1672905354062095e-05, 4.561747482512146e-05, 4.956204065820202e-05, 5.350660649128258e-05, 5.745117232436314e-05, 6.13957381574437e-05, 6.534030399052426e-05, 6.928486982360482e-05, 7.3229442932643e-05, 7.717400876572356e-05, 8.111857459880412e-05, 8.506314770784229e-05, 8.900771354092285e-05, 9.295227937400341e-05, 9.689684520708397e-05, 0.00010084141104016453, 0.0001047859841492027, 0.00010873054998228326, 0.00011267511581536382, 0.00011661968164844438, 0.00012056424748152494, 0.00012450882059056312, 0.00012845337914768606, 0.00013239795225672424, 0.00013634251081384718, 0.00014028708392288536, 0.00014423165703192353, 0.00014817621558904648, 0.00015212078869808465, 0.0001560653472552076, 0.00016000992036424577, 0.00016395447892136872, 0.0001678990520304069, 0.00017184361058752984, 0.000175788183696568, 0.00017973274225369096, 0.00018367731536272913, 0.00018762187391985208, 0.00019156644702889025, 0.0001955110055860132, 0.00019945557869505137, 0.00020340013725217432, 0.0002073447103612125, 0.00021128928347025067]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 6.0, 5.0, 8.0, 14.0, 14.0, 15.0, 15.0, 14.0, 17.0, 32.0, 26.0, 29.0, 33.0, 47.0, 41.0, 46.0, 38.0, 38.0, 35.0, 49.0, 49.0, 37.0, 26.0, 34.0, 37.0, 31.0, 25.0, 22.0, 32.0, 32.0, 31.0, 16.0, 18.0, 17.0, 10.0, 12.0, 5.0, 10.0, 8.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.55839729309082e-05, -3.4489668905735016e-05, -3.339536488056183e-05, -3.230106085538864e-05, -3.1206756830215454e-05, -3.0112452805042267e-05, -2.901814877986908e-05, -2.7923844754695892e-05, -2.6829540729522705e-05, -2.5735236704349518e-05, -2.464093267917633e-05, -2.3546628654003143e-05, -2.2452324628829956e-05, -2.135802060365677e-05, -2.026371657848358e-05, -1.9169412553310394e-05, -1.8075108528137207e-05, -1.698080450296402e-05, -1.5886500477790833e-05, -1.4792196452617645e-05, -1.3697892427444458e-05, -1.260358840227127e-05, -1.1509284377098083e-05, -1.0414980351924896e-05, -9.320676326751709e-06, -8.226372301578522e-06, -7.1320682764053345e-06, -6.037764251232147e-06, -4.94346022605896e-06, -3.849156200885773e-06, -2.7548521757125854e-06, -1.6605481505393982e-06, -5.662441253662109e-07, 5.280598998069763e-07, 1.6223639249801636e-06, 2.716667950153351e-06, 3.810971975326538e-06, 4.905276000499725e-06, 5.999580025672913e-06, 7.0938840508461e-06, 8.188188076019287e-06, 9.282492101192474e-06, 1.0376796126365662e-05, 1.1471100151538849e-05, 1.2565404176712036e-05, 1.3659708201885223e-05, 1.475401222705841e-05, 1.5848316252231598e-05, 1.6942620277404785e-05, 1.8036924302577972e-05, 1.913122832775116e-05, 2.0225532352924347e-05, 2.1319836378097534e-05, 2.241414040327072e-05, 2.350844442844391e-05, 2.4602748453617096e-05, 2.5697052478790283e-05, 2.679135650396347e-05, 2.7885660529136658e-05, 2.8979964554309845e-05, 3.0074268579483032e-05, 3.116857260465622e-05, 3.226287662982941e-05, 3.3357180655002594e-05, 3.445148468017578e-05]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 12.0, 10.0, 10.0, 12.0, 17.0, 17.0, 34.0, 14.0, 19.0, 24.0, 28.0, 30.0, 32.0, 33.0, 33.0, 38.0, 40.0, 42.0, 55.0, 39.0, 41.0, 27.0, 37.0, 43.0, 28.0, 36.0, 22.0, 33.0, 25.0, 26.0, 22.0, 15.0, 18.0, 13.0, 13.0, 6.0, 5.0, 7.0, 9.0, 6.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0], "bins": [-8.1015625, -7.85565185546875, -7.6097412109375, -7.36383056640625, -7.117919921875, -6.87200927734375, -6.6260986328125, -6.38018798828125, -6.13427734375, -5.88836669921875, -5.6424560546875, -5.39654541015625, -5.150634765625, -4.90472412109375, -4.6588134765625, -4.41290283203125, -4.1669921875, -3.92108154296875, -3.6751708984375, -3.42926025390625, -3.183349609375, -2.93743896484375, -2.6915283203125, -2.44561767578125, -2.19970703125, -1.95379638671875, -1.7078857421875, -1.46197509765625, -1.216064453125, -0.97015380859375, -0.7242431640625, -0.47833251953125, -0.232421875, 0.01348876953125, 0.2593994140625, 0.50531005859375, 0.751220703125, 0.99713134765625, 1.2430419921875, 1.48895263671875, 1.73486328125, 1.98077392578125, 2.2266845703125, 2.47259521484375, 2.718505859375, 2.96441650390625, 3.2103271484375, 3.45623779296875, 3.7021484375, 3.94805908203125, 4.1939697265625, 4.43988037109375, 4.685791015625, 4.93170166015625, 5.1776123046875, 5.42352294921875, 5.66943359375, 5.91534423828125, 6.1612548828125, 6.40716552734375, 6.653076171875, 6.89898681640625, 7.1448974609375, 7.39080810546875, 7.63671875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 14.0, 13.0, 16.0, 27.0, 30.0, 42.0, 59.0, 75.0, 123.0, 188.0, 348.0, 480.0, 916.0, 1678.0, 3140.0, 6229.0, 13461.0, 31061.0, 78224.0, 211313.0, 386303.0, 191128.0, 70820.0, 28100.0, 12194.0, 5851.0, 2912.0, 1556.0, 872.0, 495.0, 306.0, 170.0, 115.0, 79.0, 51.0, 44.0, 33.0, 26.0, 18.0, 15.0, 4.0, 5.0, 5.0, 7.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7890625, -9.477783203125, -9.16650390625, -8.855224609375, -8.5439453125, -8.232666015625, -7.92138671875, -7.610107421875, -7.298828125, -6.987548828125, -6.67626953125, -6.364990234375, -6.0537109375, -5.742431640625, -5.43115234375, -5.119873046875, -4.80859375, -4.497314453125, -4.18603515625, -3.874755859375, -3.5634765625, -3.252197265625, -2.94091796875, -2.629638671875, -2.318359375, -2.007080078125, -1.69580078125, -1.384521484375, -1.0732421875, -0.761962890625, -0.45068359375, -0.139404296875, 0.171875, 0.483154296875, 0.79443359375, 1.105712890625, 1.4169921875, 1.728271484375, 2.03955078125, 2.350830078125, 2.662109375, 2.973388671875, 3.28466796875, 3.595947265625, 3.9072265625, 4.218505859375, 4.52978515625, 4.841064453125, 5.15234375, 5.463623046875, 5.77490234375, 6.086181640625, 6.3974609375, 6.708740234375, 7.02001953125, 7.331298828125, 7.642578125, 7.953857421875, 8.26513671875, 8.576416015625, 8.8876953125, 9.198974609375, 9.51025390625, 9.821533203125, 10.1328125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 6.0, 6.0, 4.0, 6.0, 15.0, 15.0, 11.0, 15.0, 23.0, 26.0, 25.0, 24.0, 39.0, 47.0, 42.0, 69.0, 70.0, 154.0, 347.0, 1453.0, 175.0, 98.0, 62.0, 61.0, 45.0, 40.0, 29.0, 32.0, 18.0, 15.0, 20.0, 15.0, 12.0, 10.0, 4.0, 9.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.34375, -22.61767578125, -21.8916015625, -21.16552734375, -20.439453125, -19.71337890625, -18.9873046875, -18.26123046875, -17.53515625, -16.80908203125, -16.0830078125, -15.35693359375, -14.630859375, -13.90478515625, -13.1787109375, -12.45263671875, -11.7265625, -11.00048828125, -10.2744140625, -9.54833984375, -8.822265625, -8.09619140625, -7.3701171875, -6.64404296875, -5.91796875, -5.19189453125, -4.4658203125, -3.73974609375, -3.013671875, -2.28759765625, -1.5615234375, -0.83544921875, -0.109375, 0.61669921875, 1.3427734375, 2.06884765625, 2.794921875, 3.52099609375, 4.2470703125, 4.97314453125, 5.69921875, 6.42529296875, 7.1513671875, 7.87744140625, 8.603515625, 9.32958984375, 10.0556640625, 10.78173828125, 11.5078125, 12.23388671875, 12.9599609375, 13.68603515625, 14.412109375, 15.13818359375, 15.8642578125, 16.59033203125, 17.31640625, 18.04248046875, 18.7685546875, 19.49462890625, 20.220703125, 20.94677734375, 21.6728515625, 22.39892578125, 23.125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 4.0, 11.0, 9.0, 14.0, 19.0, 23.0, 29.0, 31.0, 65.0, 79.0, 106.0, 181.0, 323.0, 874.0, 8508.0, 3057342.0, 75215.0, 1658.0, 473.0, 222.0, 138.0, 82.0, 58.0, 50.0, 45.0, 26.0, 31.0, 21.0, 21.0, 9.0, 6.0, 8.0, 3.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.40625, -54.681640625, -52.95703125, -51.232421875, -49.5078125, -47.783203125, -46.05859375, -44.333984375, -42.609375, -40.884765625, -39.16015625, -37.435546875, -35.7109375, -33.986328125, -32.26171875, -30.537109375, -28.8125, -27.087890625, -25.36328125, -23.638671875, -21.9140625, -20.189453125, -18.46484375, -16.740234375, -15.015625, -13.291015625, -11.56640625, -9.841796875, -8.1171875, -6.392578125, -4.66796875, -2.943359375, -1.21875, 0.505859375, 2.23046875, 3.955078125, 5.6796875, 7.404296875, 9.12890625, 10.853515625, 12.578125, 14.302734375, 16.02734375, 17.751953125, 19.4765625, 21.201171875, 22.92578125, 24.650390625, 26.375, 28.099609375, 29.82421875, 31.548828125, 33.2734375, 34.998046875, 36.72265625, 38.447265625, 40.171875, 41.896484375, 43.62109375, 45.345703125, 47.0703125, 48.794921875, 50.51953125, 52.244140625, 53.96875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 29.0, 316.0, 560.0, 104.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.35043334960938, -220.06983947753906, -212.78924560546875, -205.50865173339844, -198.22805786132812, -190.9474639892578, -183.6668701171875, -176.3862762451172, -169.10568237304688, -161.82508850097656, -154.54449462890625, -147.26390075683594, -139.98330688476562, -132.7027130126953, -125.422119140625, -118.14152526855469, -110.86093139648438, -103.58033752441406, -96.29974365234375, -89.01914978027344, -81.73855590820312, -74.45796203613281, -67.1773681640625, -59.89677429199219, -52.616180419921875, -45.33558654785156, -38.05499267578125, -30.774398803710938, -23.493804931640625, -16.213211059570312, -8.9326171875, -1.6520233154296875, 5.628570556640625, 12.909164428710938, 20.18975830078125, 27.470352172851562, 34.750946044921875, 42.03153991699219, 49.3121337890625, 56.59272766113281, 63.873321533203125, 71.15391540527344, 78.43450927734375, 85.71510314941406, 92.99569702148438, 100.27629089355469, 107.556884765625, 114.83747863769531, 122.11807250976562, 129.39866638183594, 136.67926025390625, 143.95985412597656, 151.24044799804688, 158.5210418701172, 165.8016357421875, 173.0822296142578, 180.36282348632812, 187.64341735839844, 194.92401123046875, 202.20460510253906, 209.48519897460938, 216.7657928466797, 224.04638671875, 231.3269805908203, 238.60757446289062]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 7.0, 4.0, 6.0, 15.0, 13.0, 13.0, 22.0, 19.0, 25.0, 22.0, 25.0, 30.0, 33.0, 26.0, 26.0, 45.0, 29.0, 23.0, 49.0, 48.0, 37.0, 49.0, 36.0, 37.0, 39.0, 32.0, 30.0, 27.0, 33.0, 28.0, 28.0, 17.0, 16.0, 17.0, 9.0, 12.0, 8.0, 16.0, 10.0, 10.0, 6.0, 3.0, 8.0, 6.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-45.65306091308594, -43.89017105102539, -42.12727737426758, -40.36438751220703, -38.60149383544922, -36.83860397338867, -35.075714111328125, -33.31282043457031, -31.549928665161133, -29.787036895751953, -28.024145126342773, -26.261253356933594, -24.498363494873047, -22.735469818115234, -20.972579956054688, -19.209688186645508, -17.446796417236328, -15.683904647827148, -13.921012878417969, -12.158122062683105, -10.395230293273926, -8.632338523864746, -6.869447708129883, -5.106555938720703, -3.3436641693115234, -1.5807726383209229, 0.18211889266967773, 1.9450101852416992, 3.707901954650879, 5.470793724060059, 7.233684539794922, 8.996576309204102, 10.759468078613281, 12.522359848022461, 14.28525161743164, 16.048141479492188, 17.81103515625, 19.573925018310547, 21.336816787719727, 23.099708557128906, 24.862600326538086, 26.625492095947266, 28.388383865356445, 30.151275634765625, 31.914165496826172, 33.677059173583984, 35.43994903564453, 37.202842712402344, 38.96573257446289, 40.72862243652344, 42.49151611328125, 44.2544059753418, 46.01729965209961, 47.780189514160156, 49.54308319091797, 51.305973052978516, 53.06886291503906, 54.83175277709961, 56.59464645385742, 58.35753631591797, 60.12042999267578, 61.88331985473633, 63.646209716796875, 65.40910339355469, 67.1719970703125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 4.0, 5.0, 9.0, 14.0, 16.0, 17.0, 20.0, 14.0, 17.0, 22.0, 22.0, 31.0, 36.0, 38.0, 41.0, 44.0, 39.0, 43.0, 40.0, 50.0, 41.0, 36.0, 39.0, 38.0, 31.0, 40.0, 22.0, 27.0, 24.0, 23.0, 35.0, 19.0, 14.0, 13.0, 11.0, 8.0, 8.0, 8.0, 12.0, 2.0, 3.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-9.171875, -8.8980712890625, -8.624267578125, -8.3504638671875, -8.07666015625, -7.8028564453125, -7.529052734375, -7.2552490234375, -6.9814453125, -6.7076416015625, -6.433837890625, -6.1600341796875, -5.88623046875, -5.6124267578125, -5.338623046875, -5.0648193359375, -4.791015625, -4.5172119140625, -4.243408203125, -3.9696044921875, -3.69580078125, -3.4219970703125, -3.148193359375, -2.8743896484375, -2.6005859375, -2.3267822265625, -2.052978515625, -1.7791748046875, -1.50537109375, -1.2315673828125, -0.957763671875, -0.6839599609375, -0.41015625, -0.1363525390625, 0.137451171875, 0.4112548828125, 0.68505859375, 0.9588623046875, 1.232666015625, 1.5064697265625, 1.7802734375, 2.0540771484375, 2.327880859375, 2.6016845703125, 2.87548828125, 3.1492919921875, 3.423095703125, 3.6968994140625, 3.970703125, 4.2445068359375, 4.518310546875, 4.7921142578125, 5.06591796875, 5.3397216796875, 5.613525390625, 5.8873291015625, 6.1611328125, 6.4349365234375, 6.708740234375, 6.9825439453125, 7.25634765625, 7.5301513671875, 7.803955078125, 8.0777587890625, 8.3515625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 10.0, 1.0, 15.0, 11.0, 21.0, 28.0, 30.0, 49.0, 67.0, 89.0, 106.0, 144.0, 223.0, 276.0, 438.0, 673.0, 1157.0, 2441.0, 6552.0, 26711.0, 234331.0, 3081548.0, 765709.0, 55262.0, 10701.0, 3519.0, 1493.0, 847.0, 546.0, 351.0, 254.0, 170.0, 132.0, 87.0, 84.0, 74.0, 37.0, 29.0, 24.0, 13.0, 15.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.34375, -32.0458984375, -30.748046875, -29.4501953125, -28.15234375, -26.8544921875, -25.556640625, -24.2587890625, -22.9609375, -21.6630859375, -20.365234375, -19.0673828125, -17.76953125, -16.4716796875, -15.173828125, -13.8759765625, -12.578125, -11.2802734375, -9.982421875, -8.6845703125, -7.38671875, -6.0888671875, -4.791015625, -3.4931640625, -2.1953125, -0.8974609375, 0.400390625, 1.6982421875, 2.99609375, 4.2939453125, 5.591796875, 6.8896484375, 8.1875, 9.4853515625, 10.783203125, 12.0810546875, 13.37890625, 14.6767578125, 15.974609375, 17.2724609375, 18.5703125, 19.8681640625, 21.166015625, 22.4638671875, 23.76171875, 25.0595703125, 26.357421875, 27.6552734375, 28.953125, 30.2509765625, 31.548828125, 32.8466796875, 34.14453125, 35.4423828125, 36.740234375, 38.0380859375, 39.3359375, 40.6337890625, 41.931640625, 43.2294921875, 44.52734375, 45.8251953125, 47.123046875, 48.4208984375, 49.71875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 5.0, 8.0, 8.0, 6.0, 12.0, 12.0, 16.0, 41.0, 42.0, 67.0, 88.0, 103.0, 138.0, 176.0, 269.0, 389.0, 508.0, 531.0, 404.0, 308.0, 190.0, 171.0, 112.0, 96.0, 90.0, 73.0, 44.0, 39.0, 33.0, 22.0, 14.0, 11.0, 14.0, 5.0, 4.0, 5.0, 9.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.15625, -15.53857421875, -14.9208984375, -14.30322265625, -13.685546875, -13.06787109375, -12.4501953125, -11.83251953125, -11.21484375, -10.59716796875, -9.9794921875, -9.36181640625, -8.744140625, -8.12646484375, -7.5087890625, -6.89111328125, -6.2734375, -5.65576171875, -5.0380859375, -4.42041015625, -3.802734375, -3.18505859375, -2.5673828125, -1.94970703125, -1.33203125, -0.71435546875, -0.0966796875, 0.52099609375, 1.138671875, 1.75634765625, 2.3740234375, 2.99169921875, 3.609375, 4.22705078125, 4.8447265625, 5.46240234375, 6.080078125, 6.69775390625, 7.3154296875, 7.93310546875, 8.55078125, 9.16845703125, 9.7861328125, 10.40380859375, 11.021484375, 11.63916015625, 12.2568359375, 12.87451171875, 13.4921875, 14.10986328125, 14.7275390625, 15.34521484375, 15.962890625, 16.58056640625, 17.1982421875, 17.81591796875, 18.43359375, 19.05126953125, 19.6689453125, 20.28662109375, 20.904296875, 21.52197265625, 22.1396484375, 22.75732421875, 23.375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 6.0, 10.0, 8.0, 8.0, 15.0, 16.0, 28.0, 26.0, 43.0, 46.0, 75.0, 121.0, 251.0, 528.0, 1615.0, 7829.0, 77028.0, 2586029.0, 1460427.0, 52144.0, 5894.0, 1256.0, 404.0, 175.0, 93.0, 49.0, 42.0, 26.0, 21.0, 16.0, 9.0, 12.0, 6.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-50.71875, -49.17822265625, -47.6376953125, -46.09716796875, -44.556640625, -43.01611328125, -41.4755859375, -39.93505859375, -38.39453125, -36.85400390625, -35.3134765625, -33.77294921875, -32.232421875, -30.69189453125, -29.1513671875, -27.61083984375, -26.0703125, -24.52978515625, -22.9892578125, -21.44873046875, -19.908203125, -18.36767578125, -16.8271484375, -15.28662109375, -13.74609375, -12.20556640625, -10.6650390625, -9.12451171875, -7.583984375, -6.04345703125, -4.5029296875, -2.96240234375, -1.421875, 0.11865234375, 1.6591796875, 3.19970703125, 4.740234375, 6.28076171875, 7.8212890625, 9.36181640625, 10.90234375, 12.44287109375, 13.9833984375, 15.52392578125, 17.064453125, 18.60498046875, 20.1455078125, 21.68603515625, 23.2265625, 24.76708984375, 26.3076171875, 27.84814453125, 29.388671875, 30.92919921875, 32.4697265625, 34.01025390625, 35.55078125, 37.09130859375, 38.6318359375, 40.17236328125, 41.712890625, 43.25341796875, 44.7939453125, 46.33447265625, 47.875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 8.0, 14.0, 27.0, 27.0, 54.0, 69.0, 94.0, 118.0, 125.0, 105.0, 99.0, 60.0, 54.0, 45.0, 23.0, 18.0, 9.0, 10.0, 8.0, 5.0, 4.0, 1.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.996826171875, -159.96437072753906, -153.93190002441406, -147.89944458007812, -141.86697387695312, -135.8345184326172, -129.80206298828125, -123.76959228515625, -117.73712921142578, -111.70466613769531, -105.67220306396484, -99.63973999023438, -93.60728454589844, -87.57481384277344, -81.5423583984375, -75.50989532470703, -69.47743225097656, -63.444969177246094, -57.412506103515625, -51.38004684448242, -45.34758377075195, -39.315120697021484, -33.28266143798828, -27.250198364257812, -21.217735290527344, -15.185273170471191, -9.152811050415039, -3.120349884033203, 2.9121131896972656, 8.944576263427734, 14.977035522460938, 21.009498596191406, 27.041946411132812, 33.07440948486328, 39.10687255859375, 45.13933181762695, 51.17179489135742, 57.20425796508789, 63.236717224121094, 69.26918029785156, 75.30164337158203, 81.3341064453125, 87.36656951904297, 93.39903259277344, 99.43148803710938, 105.46395874023438, 111.49641418457031, 117.52887725830078, 123.56134033203125, 129.5937957763672, 135.6262664794922, 141.65872192382812, 147.69119262695312, 153.72364807128906, 159.756103515625, 165.78857421875, 171.821044921875, 177.85350036621094, 183.88597106933594, 189.91842651367188, 195.95089721679688, 201.9833526611328, 208.01580810546875, 214.04827880859375, 220.0807342529297]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 10.0, 10.0, 9.0, 12.0, 31.0, 15.0, 23.0, 16.0, 32.0, 39.0, 36.0, 35.0, 42.0, 52.0, 45.0, 51.0, 48.0, 48.0, 47.0, 56.0, 51.0, 44.0, 40.0, 31.0, 34.0, 30.0, 29.0, 19.0, 12.0, 17.0, 8.0, 6.0, 7.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-135.88218688964844, -131.83721923828125, -127.79224395751953, -123.74726867675781, -119.70230102539062, -115.6573257446289, -111.61235046386719, -107.5673828125, -103.52240753173828, -99.47743225097656, -95.43246459960938, -91.38748931884766, -87.34251403808594, -83.29754638671875, -79.25257110595703, -75.20759582519531, -71.16262817382812, -67.1176528930664, -63.07268524169922, -59.0277099609375, -54.98273849487305, -50.937767028808594, -46.892791748046875, -42.84782028198242, -38.80284881591797, -34.757877349853516, -30.71290397644043, -26.667930603027344, -22.62295913696289, -18.577987670898438, -14.533014297485352, -10.488040924072266, -6.443084716796875, -2.3981122970581055, 1.646860122680664, 5.691832542419434, 9.736804962158203, 13.781776428222656, 17.826749801635742, 21.871723175048828, 25.91669464111328, 29.961666107177734, 34.00663757324219, 38.051612854003906, 42.09658432006836, 46.14155578613281, 50.18653106689453, 54.231502532958984, 58.27647399902344, 62.32144546508789, 66.36641693115234, 70.41139221191406, 74.45635986328125, 78.50133514404297, 82.54631042480469, 86.59127807617188, 90.6362533569336, 94.68122863769531, 98.7261962890625, 102.77117156982422, 106.81614685058594, 110.86111450195312, 114.90608978271484, 118.95106506347656, 122.99603271484375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 8.0, 4.0, 5.0, 12.0, 9.0, 18.0, 19.0, 17.0, 23.0, 21.0, 24.0, 31.0, 25.0, 43.0, 28.0, 45.0, 48.0, 48.0, 52.0, 30.0, 46.0, 39.0, 48.0, 54.0, 37.0, 42.0, 31.0, 32.0, 27.0, 27.0, 26.0, 18.0, 10.0, 13.0, 10.0, 8.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-219.125, -212.92578125, -206.7265625, -200.52734375, -194.328125, -188.12890625, -181.9296875, -175.73046875, -169.53125, -163.33203125, -157.1328125, -150.93359375, -144.734375, -138.53515625, -132.3359375, -126.13671875, -119.9375, -113.73828125, -107.5390625, -101.33984375, -95.140625, -88.94140625, -82.7421875, -76.54296875, -70.34375, -64.14453125, -57.9453125, -51.74609375, -45.546875, -39.34765625, -33.1484375, -26.94921875, -20.75, -14.55078125, -8.3515625, -2.15234375, 4.046875, 10.24609375, 16.4453125, 22.64453125, 28.84375, 35.04296875, 41.2421875, 47.44140625, 53.640625, 59.83984375, 66.0390625, 72.23828125, 78.4375, 84.63671875, 90.8359375, 97.03515625, 103.234375, 109.43359375, 115.6328125, 121.83203125, 128.03125, 134.23046875, 140.4296875, 146.62890625, 152.828125, 159.02734375, 165.2265625, 171.42578125, 177.625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 9.0, 9.0, 17.0, 32.0, 39.0, 53.0, 83.0, 112.0, 174.0, 232.0, 339.0, 530.0, 779.0, 1230.0, 1766.0, 2822.0, 4329.0, 6865.0, 10841.0, 17315.0, 28731.0, 48789.0, 90531.0, 191406.0, 331684.0, 138101.0, 69975.0, 38967.0, 23186.0, 14350.0, 8888.0, 5663.0, 3646.0, 2357.0, 1534.0, 1042.0, 698.0, 437.0, 306.0, 234.0, 133.0, 100.0, 71.0, 35.0, 35.0, 26.0, 18.0, 14.0, 10.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.390625, -16.816650390625, -16.24267578125, -15.668701171875, -15.0947265625, -14.520751953125, -13.94677734375, -13.372802734375, -12.798828125, -12.224853515625, -11.65087890625, -11.076904296875, -10.5029296875, -9.928955078125, -9.35498046875, -8.781005859375, -8.20703125, -7.633056640625, -7.05908203125, -6.485107421875, -5.9111328125, -5.337158203125, -4.76318359375, -4.189208984375, -3.615234375, -3.041259765625, -2.46728515625, -1.893310546875, -1.3193359375, -0.745361328125, -0.17138671875, 0.402587890625, 0.9765625, 1.550537109375, 2.12451171875, 2.698486328125, 3.2724609375, 3.846435546875, 4.42041015625, 4.994384765625, 5.568359375, 6.142333984375, 6.71630859375, 7.290283203125, 7.8642578125, 8.438232421875, 9.01220703125, 9.586181640625, 10.16015625, 10.734130859375, 11.30810546875, 11.882080078125, 12.4560546875, 13.030029296875, 13.60400390625, 14.177978515625, 14.751953125, 15.325927734375, 15.89990234375, 16.473876953125, 17.0478515625, 17.621826171875, 18.19580078125, 18.769775390625, 19.34375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 5.0, 11.0, 11.0, 12.0, 14.0, 16.0, 35.0, 23.0, 29.0, 31.0, 40.0, 31.0, 37.0, 37.0, 36.0, 42.0, 35.0, 1073.0, 55.0, 51.0, 45.0, 46.0, 48.0, 39.0, 27.0, 31.0, 32.0, 28.0, 21.0, 14.0, 20.0, 14.0, 9.0, 4.0, 5.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-165.875, -160.669921875, -155.46484375, -150.259765625, -145.0546875, -139.849609375, -134.64453125, -129.439453125, -124.234375, -119.029296875, -113.82421875, -108.619140625, -103.4140625, -98.208984375, -93.00390625, -87.798828125, -82.59375, -77.388671875, -72.18359375, -66.978515625, -61.7734375, -56.568359375, -51.36328125, -46.158203125, -40.953125, -35.748046875, -30.54296875, -25.337890625, -20.1328125, -14.927734375, -9.72265625, -4.517578125, 0.6875, 5.892578125, 11.09765625, 16.302734375, 21.5078125, 26.712890625, 31.91796875, 37.123046875, 42.328125, 47.533203125, 52.73828125, 57.943359375, 63.1484375, 68.353515625, 73.55859375, 78.763671875, 83.96875, 89.173828125, 94.37890625, 99.583984375, 104.7890625, 109.994140625, 115.19921875, 120.404296875, 125.609375, 130.814453125, 136.01953125, 141.224609375, 146.4296875, 151.634765625, 156.83984375, 162.044921875, 167.25]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 7.0, 13.0, 9.0, 17.0, 32.0, 41.0, 58.0, 75.0, 119.0, 191.0, 292.0, 464.0, 661.0, 1131.0, 1816.0, 2827.0, 4729.0, 8211.0, 13740.0, 24468.0, 44889.0, 88245.0, 214708.0, 1433732.0, 122955.0, 58787.0, 31426.0, 17530.0, 10212.0, 6048.0, 3663.0, 2164.0, 1419.0, 880.0, 542.0, 347.0, 223.0, 135.0, 121.0, 77.0, 40.0, 26.0, 23.0, 10.0, 12.0, 12.0, 1.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.25, -10.9007568359375, -10.551513671875, -10.2022705078125, -9.85302734375, -9.5037841796875, -9.154541015625, -8.8052978515625, -8.4560546875, -8.1068115234375, -7.757568359375, -7.4083251953125, -7.05908203125, -6.7098388671875, -6.360595703125, -6.0113525390625, -5.662109375, -5.3128662109375, -4.963623046875, -4.6143798828125, -4.26513671875, -3.9158935546875, -3.566650390625, -3.2174072265625, -2.8681640625, -2.5189208984375, -2.169677734375, -1.8204345703125, -1.47119140625, -1.1219482421875, -0.772705078125, -0.4234619140625, -0.07421875, 0.2750244140625, 0.624267578125, 0.9735107421875, 1.32275390625, 1.6719970703125, 2.021240234375, 2.3704833984375, 2.7197265625, 3.0689697265625, 3.418212890625, 3.7674560546875, 4.11669921875, 4.4659423828125, 4.815185546875, 5.1644287109375, 5.513671875, 5.8629150390625, 6.212158203125, 6.5614013671875, 6.91064453125, 7.2598876953125, 7.609130859375, 7.9583740234375, 8.3076171875, 8.6568603515625, 9.006103515625, 9.3553466796875, 9.70458984375, 10.0538330078125, 10.403076171875, 10.7523193359375, 11.1015625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 4.0, 8.0, 8.0, 14.0, 13.0, 19.0, 13.0, 17.0, 25.0, 33.0, 26.0, 50.0, 49.0, 55.0, 63.0, 54.0, 70.0, 64.0, 64.0, 52.0, 55.0, 43.0, 40.0, 29.0, 15.0, 27.0, 12.0, 13.0, 17.0, 8.0, 13.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00251007080078125, -0.002418339252471924, -0.0023266077041625977, -0.0022348761558532715, -0.0021431446075439453, -0.002051413059234619, -0.001959681510925293, -0.0018679499626159668, -0.0017762184143066406, -0.0016844868659973145, -0.0015927553176879883, -0.0015010237693786621, -0.001409292221069336, -0.0013175606727600098, -0.0012258291244506836, -0.0011340975761413574, -0.0010423660278320312, -0.0009506344795227051, -0.0008589029312133789, -0.0007671713829040527, -0.0006754398345947266, -0.0005837082862854004, -0.0004919767379760742, -0.00040024518966674805, -0.0003085136413574219, -0.0002167820930480957, -0.00012505054473876953, -3.331899642944336e-05, 5.841255187988281e-05, 0.00015014410018920898, 0.00024187564849853516, 0.00033360719680786133, 0.0004253387451171875, 0.0005170702934265137, 0.0006088018417358398, 0.000700533390045166, 0.0007922649383544922, 0.0008839964866638184, 0.0009757280349731445, 0.0010674595832824707, 0.0011591911315917969, 0.001250922679901123, 0.0013426542282104492, 0.0014343857765197754, 0.0015261173248291016, 0.0016178488731384277, 0.001709580421447754, 0.00180131196975708, 0.0018930435180664062, 0.0019847750663757324, 0.0020765066146850586, 0.0021682381629943848, 0.002259969711303711, 0.002351701259613037, 0.0024434328079223633, 0.0025351643562316895, 0.0026268959045410156, 0.002718627452850342, 0.002810359001159668, 0.002902090549468994, 0.0029938220977783203, 0.0030855536460876465, 0.0031772851943969727, 0.003269016742706299, 0.003360748291015625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 12.0, 17.0, 33.0, 40.0, 59.0, 79.0, 145.0, 216.0, 321.0, 606.0, 1204.0, 2470.0, 6011.0, 17200.0, 61158.0, 352974.0, 498801.0, 74414.0, 20267.0, 6770.0, 2761.0, 1242.0, 709.0, 377.0, 187.0, 160.0, 116.0, 42.0, 52.0, 28.0, 28.0, 12.0, 12.0, 7.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0144805908203125, -0.013998985290527344, -0.013517379760742188, -0.013035774230957031, -0.012554168701171875, -0.012072563171386719, -0.011590957641601562, -0.011109352111816406, -0.01062774658203125, -0.010146141052246094, -0.009664535522460938, -0.009182929992675781, -0.008701324462890625, -0.008219718933105469, -0.0077381134033203125, -0.007256507873535156, -0.00677490234375, -0.006293296813964844, -0.0058116912841796875, -0.005330085754394531, -0.004848480224609375, -0.004366874694824219, -0.0038852691650390625, -0.0034036636352539062, -0.00292205810546875, -0.0024404525756835938, -0.0019588470458984375, -0.0014772415161132812, -0.000995635986328125, -0.0005140304565429688, -3.24249267578125e-05, 0.00044918060302734375, 0.0009307861328125, 0.0014123916625976562, 0.0018939971923828125, 0.0023756027221679688, 0.002857208251953125, 0.0033388137817382812, 0.0038204193115234375, 0.004302024841308594, 0.00478363037109375, 0.005265235900878906, 0.0057468414306640625, 0.006228446960449219, 0.006710052490234375, 0.007191658020019531, 0.0076732635498046875, 0.008154869079589844, 0.008636474609375, 0.009118080139160156, 0.009599685668945312, 0.010081291198730469, 0.010562896728515625, 0.011044502258300781, 0.011526107788085938, 0.012007713317871094, 0.01248931884765625, 0.012970924377441406, 0.013452529907226562, 0.013934135437011719, 0.014415740966796875, 0.014897346496582031, 0.015378952026367188, 0.015860557556152344, 0.0163421630859375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 8.0, 13.0, 25.0, 38.0, 41.0, 76.0, 113.0, 160.0, 196.0, 130.0, 65.0, 46.0, 24.0, 17.0, 8.0, 6.0, 4.0, 7.0, 2.0, 1.0, 4.0], "bins": [-0.005109437741339207, -0.005009548272937536, -0.004909659270197153, -0.004809769801795483, -0.004709880333393812, -0.004609991330653429, -0.004510101862251759, -0.004410212859511375, -0.004310323391109705, -0.0042104339227080345, -0.004110544919967651, -0.004010655451565981, -0.0039107659831643105, -0.0038108769804239273, -0.003710987512022257, -0.00361109827645123, -0.0035112090408802032, -0.0034113198053091764, -0.003311430336907506, -0.003211541101336479, -0.0031116518657654524, -0.0030117626301944256, -0.002911873161792755, -0.0028119839262217283, -0.002712094457820058, -0.002612205222249031, -0.0025123157538473606, -0.002412426518276334, -0.002312537282705307, -0.0022126478143036366, -0.0021127585787326097, -0.002012869343161583, -0.0019129799911752343, -0.0018130906391888857, -0.0017132014036178589, -0.0016133120516315103, -0.0015134228160604835, -0.0014135334640741348, -0.001313644228503108, -0.0012137548765167594, -0.0011138655245304108, -0.0010139761725440621, -0.0009140869369730353, -0.0008141975849866867, -0.0007143083494156599, -0.0006144189974293113, -0.0005145297036506236, -0.00041464040987193584, -0.00031475117430090904, -0.00021486188052222133, -0.00011497257219161838, -1.5083263861015439e-05, 8.480602991767228e-05, 0.00018469535280019045, 0.00028458464657887816, 0.0003844739403575659, 0.0004843632341362536, 0.0005842525279149413, 0.000684141821693629, 0.0007840311154723167, 0.0008839204674586654, 0.000983809819445014, 0.0010836990550160408, 0.0011835882905870676, 0.0012834776425734162]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 9.0, 11.0, 10.0, 15.0, 17.0, 14.0, 20.0, 27.0, 26.0, 29.0, 26.0, 40.0, 37.0, 50.0, 53.0, 34.0, 46.0, 57.0, 43.0, 35.0, 38.0, 34.0, 33.0, 31.0, 32.0, 28.0, 22.0, 32.0, 31.0, 18.0, 15.0, 16.0, 12.0, 13.0, 6.0, 7.0, 9.0, 6.0, 3.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018625259399414062, -0.001807444728910923, -0.0017523635178804398, -0.0016972823068499565, -0.0016422010958194733, -0.00158711988478899, -0.0015320386737585068, -0.0014769574627280235, -0.0014218762516975403, -0.001366795040667057, -0.0013117138296365738, -0.0012566326186060905, -0.0012015514075756073, -0.001146470196545124, -0.0010913889855146408, -0.0010363077744841576, -0.0009812265634536743, -0.0009261453524231911, -0.0008710641413927078, -0.0008159829303622246, -0.0007609017193317413, -0.0007058205083012581, -0.0006507392972707748, -0.0005956580862402916, -0.0005405768752098083, -0.0004854956641793251, -0.00043041445314884186, -0.0003753332421183586, -0.00032025203108787537, -0.0002651708200573921, -0.00021008960902690887, -0.00015500839799642563, -9.992718696594238e-05, -4.484597593545914e-05, 1.0235235095024109e-05, 6.531644612550735e-05, 0.0001203976571559906, 0.00017547886818647385, 0.0002305600792169571, 0.00028564129024744034, 0.0003407225012779236, 0.00039580371230840683, 0.0004508849233388901, 0.0005059661343693733, 0.0005610473453998566, 0.0006161285564303398, 0.0006712097674608231, 0.0007262909784913063, 0.0007813721895217896, 0.0008364534005522728, 0.000891534611582756, 0.0009466158226132393, 0.0010016970336437225, 0.0010567782446742058, 0.001111859455704689, 0.0011669406667351723, 0.0012220218777656555, 0.0012771030887961388, 0.001332184299826622, 0.0013872655108571053, 0.0014423467218875885, 0.0014974279329180717, 0.001552509143948555, 0.0016075903549790382, 0.0016626715660095215]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 8.0, 4.0, 5.0, 12.0, 9.0, 18.0, 19.0, 17.0, 23.0, 21.0, 24.0, 31.0, 25.0, 43.0, 28.0, 45.0, 48.0, 48.0, 52.0, 30.0, 46.0, 39.0, 48.0, 53.0, 38.0, 42.0, 31.0, 32.0, 27.0, 27.0, 26.0, 17.0, 11.0, 13.0, 10.0, 8.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-219.125, -212.92578125, -206.7265625, -200.52734375, -194.328125, -188.12890625, -181.9296875, -175.73046875, -169.53125, -163.33203125, -157.1328125, -150.93359375, -144.734375, -138.53515625, -132.3359375, -126.13671875, -119.9375, -113.73828125, -107.5390625, -101.33984375, -95.140625, -88.94140625, -82.7421875, -76.54296875, -70.34375, -64.14453125, -57.9453125, -51.74609375, -45.546875, -39.34765625, -33.1484375, -26.94921875, -20.75, -14.55078125, -8.3515625, -2.15234375, 4.046875, 10.24609375, 16.4453125, 22.64453125, 28.84375, 35.04296875, 41.2421875, 47.44140625, 53.640625, 59.83984375, 66.0390625, 72.23828125, 78.4375, 84.63671875, 90.8359375, 97.03515625, 103.234375, 109.43359375, 115.6328125, 121.83203125, 128.03125, 134.23046875, 140.4296875, 146.62890625, 152.828125, 159.02734375, 165.2265625, 171.42578125, 177.625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 2.0, 7.0, 5.0, 9.0, 10.0, 12.0, 23.0, 25.0, 32.0, 32.0, 55.0, 91.0, 154.0, 331.0, 768.0, 2158.0, 7030.0, 29010.0, 148006.0, 535256.0, 259061.0, 49906.0, 11254.0, 3227.0, 1096.0, 441.0, 196.0, 128.0, 55.0, 43.0, 34.0, 23.0, 12.0, 16.0, 8.0, 14.0, 6.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-42.96875, -41.76416015625, -40.5595703125, -39.35498046875, -38.150390625, -36.94580078125, -35.7412109375, -34.53662109375, -33.33203125, -32.12744140625, -30.9228515625, -29.71826171875, -28.513671875, -27.30908203125, -26.1044921875, -24.89990234375, -23.6953125, -22.49072265625, -21.2861328125, -20.08154296875, -18.876953125, -17.67236328125, -16.4677734375, -15.26318359375, -14.05859375, -12.85400390625, -11.6494140625, -10.44482421875, -9.240234375, -8.03564453125, -6.8310546875, -5.62646484375, -4.421875, -3.21728515625, -2.0126953125, -0.80810546875, 0.396484375, 1.60107421875, 2.8056640625, 4.01025390625, 5.21484375, 6.41943359375, 7.6240234375, 8.82861328125, 10.033203125, 11.23779296875, 12.4423828125, 13.64697265625, 14.8515625, 16.05615234375, 17.2607421875, 18.46533203125, 19.669921875, 20.87451171875, 22.0791015625, 23.28369140625, 24.48828125, 25.69287109375, 26.8974609375, 28.10205078125, 29.306640625, 30.51123046875, 31.7158203125, 32.92041015625, 34.125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 8.0, 5.0, 16.0, 15.0, 24.0, 31.0, 59.0, 54.0, 76.0, 94.0, 101.0, 2129.0, 91.0, 86.0, 71.0, 55.0, 35.0, 31.0, 25.0, 17.0, 16.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-453.75, -435.75390625, -417.7578125, -399.76171875, -381.765625, -363.76953125, -345.7734375, -327.77734375, -309.78125, -291.78515625, -273.7890625, -255.79296875, -237.796875, -219.80078125, -201.8046875, -183.80859375, -165.8125, -147.81640625, -129.8203125, -111.82421875, -93.828125, -75.83203125, -57.8359375, -39.83984375, -21.84375, -3.84765625, 14.1484375, 32.14453125, 50.140625, 68.13671875, 86.1328125, 104.12890625, 122.125, 140.12109375, 158.1171875, 176.11328125, 194.109375, 212.10546875, 230.1015625, 248.09765625, 266.09375, 284.08984375, 302.0859375, 320.08203125, 338.078125, 356.07421875, 374.0703125, 392.06640625, 410.0625, 428.05859375, 446.0546875, 464.05078125, 482.046875, 500.04296875, 518.0390625, 536.03515625, 554.03125, 572.02734375, 590.0234375, 608.01953125, 626.015625, 644.01171875, 662.0078125, 680.00390625, 698.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 9.0, 16.0, 7.0, 25.0, 31.0, 33.0, 73.0, 114.0, 189.0, 333.0, 606.0, 1294.0, 3748.0, 18055.0, 210309.0, 2827116.0, 70482.0, 8908.0, 2316.0, 853.0, 488.0, 276.0, 150.0, 95.0, 59.0, 36.0, 21.0, 13.0, 10.0, 8.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.96875, -48.59228515625, -47.2158203125, -45.83935546875, -44.462890625, -43.08642578125, -41.7099609375, -40.33349609375, -38.95703125, -37.58056640625, -36.2041015625, -34.82763671875, -33.451171875, -32.07470703125, -30.6982421875, -29.32177734375, -27.9453125, -26.56884765625, -25.1923828125, -23.81591796875, -22.439453125, -21.06298828125, -19.6865234375, -18.31005859375, -16.93359375, -15.55712890625, -14.1806640625, -12.80419921875, -11.427734375, -10.05126953125, -8.6748046875, -7.29833984375, -5.921875, -4.54541015625, -3.1689453125, -1.79248046875, -0.416015625, 0.96044921875, 2.3369140625, 3.71337890625, 5.08984375, 6.46630859375, 7.8427734375, 9.21923828125, 10.595703125, 11.97216796875, 13.3486328125, 14.72509765625, 16.1015625, 17.47802734375, 18.8544921875, 20.23095703125, 21.607421875, 22.98388671875, 24.3603515625, 25.73681640625, 27.11328125, 28.48974609375, 29.8662109375, 31.24267578125, 32.619140625, 33.99560546875, 35.3720703125, 36.74853515625, 38.125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 13.0, 33.0, 67.0, 231.0, 352.0, 148.0, 74.0, 25.0, 24.0, 10.0, 8.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-826.6935424804688, -791.2064208984375, -755.7192993164062, -720.232177734375, -684.7450561523438, -649.2579345703125, -613.7708740234375, -578.28369140625, -542.796630859375, -507.30950927734375, -471.8223876953125, -436.33526611328125, -400.84814453125, -365.36102294921875, -329.8739318847656, -294.3868103027344, -258.899658203125, -223.41253662109375, -187.9254150390625, -152.4383087158203, -116.95118713378906, -81.46406555175781, -45.976959228515625, -10.489837646484375, 24.997283935546875, 60.48440170288086, 95.97151947021484, 131.45863342285156, 166.9457550048828, 202.43287658691406, 237.91998291015625, 273.4071044921875, 308.894287109375, 344.38140869140625, 379.8685302734375, 415.35565185546875, 450.8427734375, 486.32989501953125, 521.8170166015625, 557.3040771484375, 592.791259765625, 628.2783813476562, 663.7655029296875, 699.2526245117188, 734.73974609375, 770.2268676757812, 805.7139892578125, 841.2010498046875, 876.6881713867188, 912.17529296875, 947.6624145507812, 983.1495361328125, 1018.6366577148438, 1054.123779296875, 1089.61083984375, 1125.0980224609375, 1160.5850830078125, 1196.0721435546875, 1231.559326171875, 1267.04638671875, 1302.5335693359375, 1338.0206298828125, 1373.5078125, 1408.994873046875, 1444.4820556640625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 6.0, 6.0, 7.0, 6.0, 19.0, 12.0, 12.0, 11.0, 21.0, 22.0, 23.0, 35.0, 31.0, 56.0, 38.0, 44.0, 52.0, 52.0, 53.0, 49.0, 39.0, 33.0, 40.0, 30.0, 38.0, 35.0, 39.0, 30.0, 30.0, 18.0, 19.0, 21.0, 15.0, 21.0, 10.0, 6.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0], "bins": [-764.2469482421875, -744.0936279296875, -723.9403686523438, -703.7870483398438, -683.6337890625, -663.48046875, -643.3272094726562, -623.1738891601562, -603.0206298828125, -582.8673095703125, -562.7140502929688, -542.5607299804688, -522.407470703125, -502.254150390625, -482.1008605957031, -461.94757080078125, -441.79425048828125, -421.6409606933594, -401.4876708984375, -381.3343811035156, -361.18109130859375, -341.02777099609375, -320.8744812011719, -300.72119140625, -280.5679016113281, -260.41461181640625, -240.26132202148438, -220.10801696777344, -199.95472717285156, -179.8014373779297, -159.64813232421875, -139.49484252929688, -119.341552734375, -99.18826293945312, -79.03496551513672, -58.88167190551758, -38.72837829589844, -18.575088500976562, 1.5782089233398438, 21.73150634765625, 41.884796142578125, 62.038089752197266, 82.1913833618164, 102.34468078613281, 122.49797058105469, 142.65126037597656, 162.8045654296875, 182.95785522460938, 203.11114501953125, 223.26443481445312, 243.417724609375, 263.5710144042969, 283.72430419921875, 303.87762451171875, 324.0309143066406, 344.1842041015625, 364.3374938964844, 384.49078369140625, 404.6440734863281, 424.79736328125, 444.95068359375, 465.10394287109375, 485.25726318359375, 505.4105529785156, 525.5638427734375]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 12.0, 6.0, 9.0, 14.0, 9.0, 23.0, 26.0, 24.0, 33.0, 74.0, 70.0, 84.0, 126.0, 170.0, 230.0, 273.0, 392.0, 497.0, 746.0, 981.0, 1040567.0, 1060.0, 801.0, 561.0, 434.0, 315.0, 239.0, 185.0, 137.0, 107.0, 85.0, 68.0, 47.0, 42.0, 24.0, 25.0, 16.0, 9.0, 6.0, 6.0, 9.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-127.15357208251953, -123.48319244384766, -119.81281280517578, -116.1424331665039, -112.47205352783203, -108.80167388916016, -105.13130187988281, -101.46092224121094, -97.79054260253906, -94.12016296386719, -90.44978332519531, -86.77940368652344, -83.10902404785156, -79.43864440917969, -75.76826477050781, -72.09788513183594, -68.42750549316406, -64.75712585449219, -61.08674621582031, -57.41636657714844, -53.74598693847656, -50.07560729980469, -46.40523147583008, -42.7348518371582, -39.06447219848633, -35.39409255981445, -31.723712921142578, -28.053335189819336, -24.38295555114746, -20.712575912475586, -17.042198181152344, -13.371818542480469, -9.701431274414062, -6.031052112579346, -2.360672950744629, 1.3097057342529297, 4.980085372924805, 8.65046501159668, 12.320842742919922, 15.991222381591797, 19.661602020263672, 23.331981658935547, 27.002361297607422, 30.672739028930664, 34.343116760253906, 38.01349639892578, 41.683876037597656, 45.35425567626953, 49.024635314941406, 52.69501495361328, 56.365394592285156, 60.03577423095703, 63.706153869628906, 67.37653350830078, 71.04690551757812, 74.71728515625, 78.38766479492188, 82.05804443359375, 85.72842407226562, 89.3988037109375, 93.06918334960938, 96.73956298828125, 100.40994262695312, 104.080322265625, 107.75070190429688]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 11.0, 14.0, 16.0, 17.0, 32.0, 52.0, 110.0, 499.0, 12219.0, 51447484.0, 2253.0, 237.0, 73.0, 25.0, 11.0, 10.0, 9.0, 15.0, 11.0, 4.0, 6.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1316.0, -1273.97265625, -1231.9453125, -1189.91796875, -1147.890625, -1105.8634033203125, -1063.8360595703125, -1021.8087158203125, -979.7813720703125, -937.7540283203125, -895.7266845703125, -853.6994018554688, -811.6720581054688, -769.6447143554688, -727.617431640625, -685.590087890625, -643.562744140625, -601.535400390625, -559.508056640625, -517.4807739257812, -475.45343017578125, -433.42608642578125, -391.3987731933594, -349.3714599609375, -307.3441162109375, -265.3167724609375, -223.28945922851562, -181.2621307373047, -139.23480224609375, -97.20747375488281, -55.180145263671875, -13.15283203125, 28.8746337890625, 70.90196228027344, 112.92929077148438, 154.9566192626953, 196.98394775390625, 239.0112762451172, 281.0386047363281, 323.06591796875, 365.09326171875, 407.12060546875, 449.1479187011719, 491.17523193359375, 533.2025756835938, 575.2299194335938, 617.2572021484375, 659.2845458984375, 701.3118896484375, 743.3392333984375, 785.3665771484375, 827.3938598632812, 869.4212036132812, 911.4485473632812, 953.475830078125, 995.503173828125, 1037.530517578125, 1079.557861328125, 1121.585205078125, 1163.612548828125, 1205.639892578125, 1247.6671142578125, 1289.6944580078125, 1331.7218017578125, 1373.7491455078125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [8.0, 7.0, 15.0, 19.0, 31.0, 31.0, 43.0, 65.0, 91.0, 167.0, 228.0, 309.0, 409.0, 556.0, 784.0, 1206.0, 1687.0, 2397.0, 3355.0, 4872.0, 7088.0, 10659.0, 15641.0, 23310.0, 34902.0, 53459.0, 80996.0, 125949.0, 202203.0, 355785.0, 4041964.0, 579701.0, 272949.0, 163953.0, 103829.0, 67559.0, 43653.0, 29166.0, 19665.0, 13325.0, 8872.0, 6439.0, 4244.0, 3013.0, 2025.0, 1381.0, 1056.0, 771.0, 501.0, 351.0, 218.0, 140.0, 113.0, 99.0, 75.0, 50.0, 28.0, 20.0, 13.0, 3.0, 1.0, 3.0, 1.0, 3.0], "bins": [-2.396484375, -2.318634033203125, -2.24078369140625, -2.162933349609375, -2.0850830078125, -2.007232666015625, -1.92938232421875, -1.851531982421875, -1.773681640625, -1.695831298828125, -1.61798095703125, -1.540130615234375, -1.4622802734375, -1.384429931640625, -1.30657958984375, -1.228729248046875, -1.15087890625, -1.073028564453125, -0.99517822265625, -0.917327880859375, -0.8394775390625, -0.761627197265625, -0.68377685546875, -0.605926513671875, -0.528076171875, -0.450225830078125, -0.37237548828125, -0.294525146484375, -0.2166748046875, -0.138824462890625, -0.06097412109375, 0.016876220703125, 0.0947265625, 0.172576904296875, 0.25042724609375, 0.328277587890625, 0.4061279296875, 0.483978271484375, 0.56182861328125, 0.639678955078125, 0.717529296875, 0.795379638671875, 0.87322998046875, 0.951080322265625, 1.0289306640625, 1.106781005859375, 1.18463134765625, 1.262481689453125, 1.34033203125, 1.418182373046875, 1.49603271484375, 1.573883056640625, 1.6517333984375, 1.729583740234375, 1.80743408203125, 1.885284423828125, 1.963134765625, 2.040985107421875, 2.11883544921875, 2.196685791015625, 2.2745361328125, 2.352386474609375, 2.43023681640625, 2.508087158203125, 2.5859375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 4.0, 5.0, 7.0, 11.0, 15.0, 11.0, 14.0, 15.0, 16.0, 28.0, 20.0, 29.0, 26.0, 41.0, 30.0, 31.0, 36.0, 37.0, 42.0, 52.0, 1027.0, 78.0, 36.0, 48.0, 31.0, 32.0, 36.0, 37.0, 26.0, 24.0, 36.0, 20.0, 23.0, 22.0, 18.0, 8.0, 10.0, 8.0, 7.0, 6.0, 7.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-85.375, -82.81640625, -80.2578125, -77.69921875, -75.140625, -72.58203125, -70.0234375, -67.46484375, -64.90625, -62.34765625, -59.7890625, -57.23046875, -54.671875, -52.11328125, -49.5546875, -46.99609375, -44.4375, -41.87890625, -39.3203125, -36.76171875, -34.203125, -31.64453125, -29.0859375, -26.52734375, -23.96875, -21.41015625, -18.8515625, -16.29296875, -13.734375, -11.17578125, -8.6171875, -6.05859375, -3.5, -0.94140625, 1.6171875, 4.17578125, 6.734375, 9.29296875, 11.8515625, 14.41015625, 16.96875, 19.52734375, 22.0859375, 24.64453125, 27.203125, 29.76171875, 32.3203125, 34.87890625, 37.4375, 39.99609375, 42.5546875, 45.11328125, 47.671875, 50.23046875, 52.7890625, 55.34765625, 57.90625, 60.46484375, 63.0234375, 65.58203125, 68.140625, 70.69921875, 73.2578125, 75.81640625, 78.375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 7.0, 4.0, 4.0, 22.0, 20.0, 44.0, 41.0, 87.0, 122.0, 209.0, 235.0, 384.0, 528.0, 954.0, 1147.0, 1793.0, 2743.0, 3596.0, 5162.0, 7490.0, 11070.0, 16136.0, 22848.0, 34042.0, 49870.0, 75294.0, 114585.0, 185203.0, 312132.0, 3365309.0, 1243443.0, 310196.0, 181954.0, 114526.0, 74536.0, 49345.0, 33455.0, 22634.0, 15567.0, 10577.0, 7670.0, 5215.0, 3651.0, 2419.0, 1653.0, 1129.0, 782.0, 553.0, 390.0, 211.0, 174.0, 98.0, 92.0, 31.0, 27.0, 12.0, 12.0, 14.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.060546875, -1.994049072265625, -1.92755126953125, -1.861053466796875, -1.7945556640625, -1.728057861328125, -1.66156005859375, -1.595062255859375, -1.528564453125, -1.462066650390625, -1.39556884765625, -1.329071044921875, -1.2625732421875, -1.196075439453125, -1.12957763671875, -1.063079833984375, -0.99658203125, -0.930084228515625, -0.86358642578125, -0.797088623046875, -0.7305908203125, -0.664093017578125, -0.59759521484375, -0.531097412109375, -0.464599609375, -0.398101806640625, -0.33160400390625, -0.265106201171875, -0.1986083984375, -0.132110595703125, -0.06561279296875, 0.000885009765625, 0.0673828125, 0.133880615234375, 0.20037841796875, 0.266876220703125, 0.3333740234375, 0.399871826171875, 0.46636962890625, 0.532867431640625, 0.599365234375, 0.665863037109375, 0.73236083984375, 0.798858642578125, 0.8653564453125, 0.931854248046875, 0.99835205078125, 1.064849853515625, 1.13134765625, 1.197845458984375, 1.26434326171875, 1.330841064453125, 1.3973388671875, 1.463836669921875, 1.53033447265625, 1.596832275390625, 1.663330078125, 1.729827880859375, 1.79632568359375, 1.862823486328125, 1.9293212890625, 1.995819091796875, 2.06231689453125, 2.128814697265625, 2.1953125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 4.0, 5.0, 6.0, 12.0, 6.0, 10.0, 12.0, 18.0, 20.0, 20.0, 21.0, 23.0, 35.0, 20.0, 35.0, 45.0, 41.0, 38.0, 31.0, 38.0, 50.0, 1020.0, 76.0, 29.0, 31.0, 41.0, 28.0, 33.0, 29.0, 29.0, 30.0, 30.0, 22.0, 26.0, 12.0, 23.0, 11.0, 10.0, 13.0, 6.0, 10.0, 5.0, 6.0, 0.0, 6.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0], "bins": [-111.5625, -108.24609375, -104.9296875, -101.61328125, -98.296875, -94.98046875, -91.6640625, -88.34765625, -85.03125, -81.71484375, -78.3984375, -75.08203125, -71.765625, -68.44921875, -65.1328125, -61.81640625, -58.5, -55.18359375, -51.8671875, -48.55078125, -45.234375, -41.91796875, -38.6015625, -35.28515625, -31.96875, -28.65234375, -25.3359375, -22.01953125, -18.703125, -15.38671875, -12.0703125, -8.75390625, -5.4375, -2.12109375, 1.1953125, 4.51171875, 7.828125, 11.14453125, 14.4609375, 17.77734375, 21.09375, 24.41015625, 27.7265625, 31.04296875, 34.359375, 37.67578125, 40.9921875, 44.30859375, 47.625, 50.94140625, 54.2578125, 57.57421875, 60.890625, 64.20703125, 67.5234375, 70.83984375, 74.15625, 77.47265625, 80.7890625, 84.10546875, 87.421875, 90.73828125, 94.0546875, 97.37109375, 100.6875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 8.0, 7.0, 6.0, 14.0, 19.0, 21.0, 45.0, 45.0, 77.0, 87.0, 134.0, 158.0, 260.0, 324.0, 540.0, 668.0, 1090.0, 1611.0, 2270.0, 3286.0, 5134.0, 7438.0, 11634.0, 19919.0, 38577.0, 111165.0, 5519504.0, 435443.0, 62063.0, 27223.0, 14910.0, 9101.0, 5705.0, 4031.0, 2814.0, 1923.0, 1276.0, 850.0, 656.0, 471.0, 236.0, 167.0, 160.0, 109.0, 99.0, 33.0, 42.0, 19.0, 16.0, 14.0, 4.0, 9.0, 11.0, 1.0, 5.0], "bins": [-7.734375, -7.5181884765625, -7.302001953125, -7.0858154296875, -6.86962890625, -6.6534423828125, -6.437255859375, -6.2210693359375, -6.0048828125, -5.7886962890625, -5.572509765625, -5.3563232421875, -5.14013671875, -4.9239501953125, -4.707763671875, -4.4915771484375, -4.275390625, -4.0592041015625, -3.843017578125, -3.6268310546875, -3.41064453125, -3.1944580078125, -2.978271484375, -2.7620849609375, -2.5458984375, -2.3297119140625, -2.113525390625, -1.8973388671875, -1.68115234375, -1.4649658203125, -1.248779296875, -1.0325927734375, -0.81640625, -0.6002197265625, -0.384033203125, -0.1678466796875, 0.04833984375, 0.2645263671875, 0.480712890625, 0.6968994140625, 0.9130859375, 1.1292724609375, 1.345458984375, 1.5616455078125, 1.77783203125, 1.9940185546875, 2.210205078125, 2.4263916015625, 2.642578125, 2.8587646484375, 3.074951171875, 3.2911376953125, 3.50732421875, 3.7235107421875, 3.939697265625, 4.1558837890625, 4.3720703125, 4.5882568359375, 4.804443359375, 5.0206298828125, 5.23681640625, 5.4530029296875, 5.669189453125, 5.8853759765625, 6.1015625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 6.0, 5.0, 8.0, 11.0, 4.0, 18.0, 16.0, 13.0, 29.0, 30.0, 26.0, 29.0, 35.0, 35.0, 35.0, 44.0, 41.0, 39.0, 47.0, 1026.0, 79.0, 47.0, 53.0, 32.0, 42.0, 33.0, 31.0, 26.0, 31.0, 17.0, 22.0, 11.0, 17.0, 15.0, 11.0, 10.0, 11.0, 14.0, 4.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 2.0], "bins": [-178.5, -173.513671875, -168.52734375, -163.541015625, -158.5546875, -153.568359375, -148.58203125, -143.595703125, -138.609375, -133.623046875, -128.63671875, -123.650390625, -118.6640625, -113.677734375, -108.69140625, -103.705078125, -98.71875, -93.732421875, -88.74609375, -83.759765625, -78.7734375, -73.787109375, -68.80078125, -63.814453125, -58.828125, -53.841796875, -48.85546875, -43.869140625, -38.8828125, -33.896484375, -28.91015625, -23.923828125, -18.9375, -13.951171875, -8.96484375, -3.978515625, 1.0078125, 5.994140625, 10.98046875, 15.966796875, 20.953125, 25.939453125, 30.92578125, 35.912109375, 40.8984375, 45.884765625, 50.87109375, 55.857421875, 60.84375, 65.830078125, 70.81640625, 75.802734375, 80.7890625, 85.775390625, 90.76171875, 95.748046875, 100.734375, 105.720703125, 110.70703125, 115.693359375, 120.6796875, 125.666015625, 130.65234375, 135.638671875, 140.625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 1009.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5949.55517578125, -5826.44970703125, -5703.34423828125, -5580.23876953125, -5457.13330078125, -5334.02783203125, -5210.92236328125, -5087.8173828125, -4964.7119140625, -4841.6064453125, -4718.5009765625, -4595.3955078125, -4472.2900390625, -4349.1845703125, -4226.0791015625, -4102.9736328125, -3979.8681640625, -3856.7626953125, -3733.6572265625, -3610.5517578125, -3487.4462890625, -3364.3408203125, -3241.235595703125, -3118.130126953125, -2995.024658203125, -2871.919189453125, -2748.813720703125, -2625.708251953125, -2502.60302734375, -2379.49755859375, -2256.39208984375, -2133.28662109375, -2010.18115234375, -1887.07568359375, -1763.97021484375, -1640.8648681640625, -1517.7593994140625, -1394.6539306640625, -1271.548583984375, -1148.443115234375, -1025.337646484375, -902.232177734375, -779.1267700195312, -656.0213623046875, -532.9158935546875, -409.8104248046875, -286.70501708984375, -163.599609375, -40.494140625, 82.61129760742188, 205.71673583984375, 328.8221740722656, 451.9276123046875, 575.0330810546875, 698.1384887695312, 821.243896484375, 944.349365234375, 1067.454833984375, 1190.560302734375, 1313.6656494140625, 1436.7711181640625, 1559.8765869140625, 1682.98193359375, 1806.08740234375, 1929.19287109375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 11.0, 9.0, 5.0, 12.0, 5.0, 11.0, 14.0, 16.0, 18.0, 34.0, 34.0, 40.0, 50.0, 45.0, 41.0, 46.0, 57.0, 54.0, 56.0, 51.0, 51.0, 37.0, 37.0, 38.0, 39.0, 36.0, 28.0, 28.0, 18.0, 24.0, 11.0, 9.0, 10.0, 6.0, 8.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-594.458984375, -577.4942016601562, -560.5294189453125, -543.564697265625, -526.5999145507812, -509.6351318359375, -492.67034912109375, -475.7055969238281, -458.7408447265625, -441.77606201171875, -424.8113098144531, -407.8465270996094, -390.88177490234375, -373.9169921875, -356.95220947265625, -339.9874572753906, -323.0226745605469, -306.0578918457031, -289.0931396484375, -272.12835693359375, -255.16360473632812, -238.19882202148438, -221.2340545654297, -204.269287109375, -187.3045196533203, -170.33975219726562, -153.37498474121094, -136.41021728515625, -119.44544219970703, -102.48067474365234, -85.51589965820312, -68.55113220214844, -51.586334228515625, -34.62156677246094, -17.656795501708984, -0.6920242309570312, 16.272743225097656, 33.237510681152344, 50.20228576660156, 67.16705322265625, 84.13182067871094, 101.09658813476562, 118.06135559082031, 135.026123046875, 151.99090576171875, 168.95565795898438, 185.92044067382812, 202.8852081298828, 219.8499755859375, 236.8147430419922, 253.77951049804688, 270.7442932128906, 287.70904541015625, 304.673828125, 321.63861083984375, 338.6033630371094, 355.568115234375, 372.53289794921875, 389.4976501464844, 406.4624328613281, 423.42718505859375, 440.3919677734375, 457.35675048828125, 474.3215026855469, 491.2862854003906]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 5.0, 16.0, 4.0, 11.0, 7.0, 18.0, 23.0, 23.0, 32.0, 28.0, 53.0, 63.0, 107.0, 493.0, 828.0, 3654.0, 11216.0, 43904.0, 4084772.0, 37347.0, 7473.0, 2339.0, 946.0, 239.0, 133.0, 123.0, 81.0, 60.0, 57.0, 40.0, 31.0, 29.0, 23.0, 14.0, 13.0, 10.0, 17.0, 6.0, 7.0, 8.0, 7.0, 3.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0], "bins": [-0.406005859375, -0.3917732238769531, -0.37754058837890625, -0.3633079528808594, -0.3490753173828125, -0.3348426818847656, -0.32061004638671875, -0.3063774108886719, -0.292144775390625, -0.2779121398925781, -0.26367950439453125, -0.24944686889648438, -0.2352142333984375, -0.22098159790039062, -0.20674896240234375, -0.19251632690429688, -0.17828369140625, -0.16405105590820312, -0.14981842041015625, -0.13558578491210938, -0.1213531494140625, -0.10712051391601562, -0.09288787841796875, -0.07865524291992188, -0.064422607421875, -0.050189971923828125, -0.03595733642578125, -0.021724700927734375, -0.0074920654296875, 0.006740570068359375, 0.02097320556640625, 0.035205841064453125, 0.0494384765625, 0.06367111206054688, 0.07790374755859375, 0.09213638305664062, 0.1063690185546875, 0.12060165405273438, 0.13483428955078125, 0.14906692504882812, 0.163299560546875, 0.17753219604492188, 0.19176483154296875, 0.20599746704101562, 0.2202301025390625, 0.23446273803710938, 0.24869537353515625, 0.2629280090332031, 0.27716064453125, 0.2913932800292969, 0.30562591552734375, 0.3198585510253906, 0.3340911865234375, 0.3483238220214844, 0.36255645751953125, 0.3767890930175781, 0.391021728515625, 0.4052543640136719, 0.41948699951171875, 0.4337196350097656, 0.4479522705078125, 0.4621849060058594, 0.47641754150390625, 0.4906501770019531, 0.5048828125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 8.0, 8.0, 10.0, 11.0, 23.0, 52.0, 753.0, 24.0, 7.0, 22.0, 11.0, 5.0, 3.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.341064453125, -0.32913970947265625, -0.3172149658203125, -0.30529022216796875, -0.293365478515625, -0.28144073486328125, -0.2695159912109375, -0.25759124755859375, -0.24566650390625, -0.23374176025390625, -0.2218170166015625, -0.20989227294921875, -0.197967529296875, -0.18604278564453125, -0.1741180419921875, -0.16219329833984375, -0.1502685546875, -0.13834381103515625, -0.1264190673828125, -0.11449432373046875, -0.102569580078125, -0.09064483642578125, -0.0787200927734375, -0.06679534912109375, -0.05487060546875, -0.04294586181640625, -0.0310211181640625, -0.01909637451171875, -0.007171630859375, 0.00475311279296875, 0.0166778564453125, 0.02860260009765625, 0.04052734375, 0.05245208740234375, 0.0643768310546875, 0.07630157470703125, 0.088226318359375, 0.10015106201171875, 0.1120758056640625, 0.12400054931640625, 0.13592529296875, 0.14785003662109375, 0.1597747802734375, 0.17169952392578125, 0.183624267578125, 0.19554901123046875, 0.2074737548828125, 0.21939849853515625, 0.2313232421875, 0.24324798583984375, 0.2551727294921875, 0.26709747314453125, 0.279022216796875, 0.29094696044921875, 0.3028717041015625, 0.31479644775390625, 0.32672119140625, 0.33864593505859375, 0.3505706787109375, 0.36249542236328125, 0.374420166015625, 0.38634490966796875, 0.3982696533203125, 0.41019439697265625, 0.422119140625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 6.0, 4.0, 13.0, 8.0, 23.0, 23.0, 37.0, 77.0, 245.0, 1961.0, 454852.0, 3732904.0, 3330.0, 497.0, 160.0, 50.0, 28.0, 20.0, 10.0, 8.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.9638671875, -1.8984375, -1.8330078125, -1.767578125, -1.7021484375, -1.63671875, -1.5712890625, -1.505859375, -1.4404296875, -1.375, -1.3095703125, -1.244140625, -1.1787109375, -1.11328125, -1.0478515625, -0.982421875, -0.9169921875, -0.8515625, -0.7861328125, -0.720703125, -0.6552734375, -0.58984375, -0.5244140625, -0.458984375, -0.3935546875, -0.328125, -0.2626953125, -0.197265625, -0.1318359375, -0.06640625, -0.0009765625, 0.064453125, 0.1298828125, 0.1953125, 0.2607421875, 0.326171875, 0.3916015625, 0.45703125, 0.5224609375, 0.587890625, 0.6533203125, 0.71875, 0.7841796875, 0.849609375, 0.9150390625, 0.98046875, 1.0458984375, 1.111328125, 1.1767578125, 1.2421875, 1.3076171875, 1.373046875, 1.4384765625, 1.50390625, 1.5693359375, 1.634765625, 1.7001953125, 1.765625, 1.8310546875, 1.896484375, 1.9619140625, 2.02734375, 2.0927734375, 2.158203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 3.0, 6.0, 5.0, 6.0, 9.0, 13.0, 21.0, 50.0, 294.0, 2987.0, 487.0, 113.0, 21.0, 12.0, 8.0, 8.0, 7.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5029296875, -0.482452392578125, -0.46197509765625, -0.441497802734375, -0.4210205078125, -0.400543212890625, -0.38006591796875, -0.359588623046875, -0.339111328125, -0.318634033203125, -0.29815673828125, -0.277679443359375, -0.2572021484375, -0.236724853515625, -0.21624755859375, -0.195770263671875, -0.17529296875, -0.154815673828125, -0.13433837890625, -0.113861083984375, -0.0933837890625, -0.072906494140625, -0.05242919921875, -0.031951904296875, -0.011474609375, 0.009002685546875, 0.02947998046875, 0.049957275390625, 0.0704345703125, 0.090911865234375, 0.11138916015625, 0.131866455078125, 0.15234375, 0.172821044921875, 0.19329833984375, 0.213775634765625, 0.2342529296875, 0.254730224609375, 0.27520751953125, 0.295684814453125, 0.316162109375, 0.336639404296875, 0.35711669921875, 0.377593994140625, 0.3980712890625, 0.418548583984375, 0.43902587890625, 0.459503173828125, 0.47998046875, 0.500457763671875, 0.52093505859375, 0.541412353515625, 0.5618896484375, 0.582366943359375, 0.60284423828125, 0.623321533203125, 0.643798828125, 0.664276123046875, 0.68475341796875, 0.705230712890625, 0.7257080078125, 0.746185302734375, 0.76666259765625, 0.787139892578125, 0.8076171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 12.0, 473.0, 511.0, 13.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.223158597946167, -1.1416348218917847, -1.0601110458374023, -0.9785873889923096, -0.8970636129379272, -0.8155398368835449, -0.7340161204338074, -0.6524924039840698, -0.5709686279296875, -0.48944488167762756, -0.4079211354255676, -0.3263973891735077, -0.24487364292144775, -0.16334989666938782, -0.08182615041732788, -0.00030243396759033203, 0.08122134208679199, 0.16274508833885193, 0.24426883459091187, 0.3257925808429718, 0.40731632709503174, 0.4888400733470917, 0.5703638195991516, 0.6518875360488892, 0.7334113121032715, 0.8149350881576538, 0.8964588046073914, 0.9779825210571289, 1.0595062971115112, 1.1410300731658936, 1.2225537300109863, 1.3040775060653687, 1.38560152053833, 1.4671252965927124, 1.5486490726470947, 1.6301727294921875, 1.7116965055465698, 1.7932202816009521, 1.874743938446045, 1.9562677145004272, 2.0377914905548096, 2.1193151473999023, 2.200839042663574, 2.282362699508667, 2.3638863563537598, 2.4454102516174316, 2.5269339084625244, 2.608457565307617, 2.689981460571289, 2.771505117416382, 2.8530290126800537, 2.9345526695251465, 3.0160765647888184, 3.097600221633911, 3.179123878479004, 3.260647773742676, 3.3421714305877686, 3.4236950874328613, 3.505218982696533, 3.586742639541626, 3.6682662963867188, 3.7497901916503906, 3.8313138484954834, 3.912837505340576, 3.994361400604248]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 6.0, 6.0, 4.0, 4.0, 3.0, 4.0, 9.0, 5.0, 5.0, 6.0, 9.0, 14.0, 39.0, 40.0, 54.0, 94.0, 116.0, 129.0, 118.0, 85.0, 78.0, 48.0, 32.0, 15.0, 12.0, 11.0, 11.0, 11.0, 7.0, 2.0, 3.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0566911697387695, -1.993713617324829, -1.9307361841201782, -1.8677586317062378, -1.8047810792922974, -1.7418036460876465, -1.678826093673706, -1.6158485412597656, -1.5528709888458252, -1.4898934364318848, -1.4269160032272339, -1.3639384508132935, -1.300960898399353, -1.2379834651947021, -1.1750059127807617, -1.1120283603668213, -1.0490509271621704, -0.9860734343528748, -0.9230958819389343, -0.8601183891296387, -0.7971408367156982, -0.7341633439064026, -0.6711858510971069, -0.6082082986831665, -0.5452308058738708, -0.4822532832622528, -0.41927576065063477, -0.3562982678413391, -0.29332074522972107, -0.23034322261810303, -0.16736572980880737, -0.10438820719718933, -0.04141068458557129, 0.021566830575466156, 0.0845443457365036, 0.14752185344696045, 0.2104993760585785, 0.27347689867019653, 0.3364543914794922, 0.39943191409111023, 0.46240943670272827, 0.5253869295120239, 0.5883644819259644, 0.65134197473526, 0.7143194675445557, 0.7772970199584961, 0.8402745127677917, 0.9032520055770874, 0.9662295579910278, 1.0292071104049683, 1.0921845436096191, 1.1551620960235596, 1.2181396484375, 1.2811172008514404, 1.3440946340560913, 1.4070721864700317, 1.4700496196746826, 1.533027172088623, 1.596004605293274, 1.6589821577072144, 1.7219597101211548, 1.7849371433258057, 1.847914695739746, 1.9108922481536865, 1.973869800567627]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 13.0, 15.0, 21.0, 32.0, 31.0, 46.0, 67.0, 94.0, 135.0, 187.0, 276.0, 353.0, 489.0, 668.0, 942.0, 1376.0, 1930.0, 2886.0, 4332.0, 7072.0, 13262.0, 35969.0, 911769.0, 33470.0, 12840.0, 6848.0, 4161.0, 2745.0, 1782.0, 1335.0, 964.0, 690.0, 484.0, 337.0, 249.0, 187.0, 128.0, 96.0, 83.0, 51.0, 38.0, 26.0, 18.0, 15.0, 11.0, 8.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.552734375, -0.5357131958007812, -0.5186920166015625, -0.5016708374023438, -0.484649658203125, -0.46762847900390625, -0.4506072998046875, -0.43358612060546875, -0.41656494140625, -0.39954376220703125, -0.3825225830078125, -0.36550140380859375, -0.348480224609375, -0.33145904541015625, -0.3144378662109375, -0.29741668701171875, -0.2803955078125, -0.26337432861328125, -0.2463531494140625, -0.22933197021484375, -0.212310791015625, -0.19528961181640625, -0.1782684326171875, -0.16124725341796875, -0.14422607421875, -0.12720489501953125, -0.1101837158203125, -0.09316253662109375, -0.076141357421875, -0.05912017822265625, -0.0420989990234375, -0.02507781982421875, -0.008056640625, 0.00896453857421875, 0.0259857177734375, 0.04300689697265625, 0.060028076171875, 0.07704925537109375, 0.0940704345703125, 0.11109161376953125, 0.12811279296875, 0.14513397216796875, 0.1621551513671875, 0.17917633056640625, 0.196197509765625, 0.21321868896484375, 0.2302398681640625, 0.24726104736328125, 0.2642822265625, 0.28130340576171875, 0.2983245849609375, 0.31534576416015625, 0.332366943359375, 0.34938812255859375, 0.3664093017578125, 0.38343048095703125, 0.40045166015625, 0.41747283935546875, 0.4344940185546875, 0.45151519775390625, 0.468536376953125, 0.48555755615234375, 0.5025787353515625, 0.5195999145507812, 0.53662109375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0, 6.0, 10.0, 7.0, 9.0, 17.0, 28.0, 765.0, 38.0, 16.0, 15.0, 14.0, 9.0, 3.0, 5.0, 7.0, 4.0, 5.0, 1.0, 3.0, 4.0, 1.0, 6.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3427734375, -0.3309669494628906, -0.31916046142578125, -0.3073539733886719, -0.2955474853515625, -0.2837409973144531, -0.27193450927734375, -0.2601280212402344, -0.248321533203125, -0.23651504516601562, -0.22470855712890625, -0.21290206909179688, -0.2010955810546875, -0.18928909301757812, -0.17748260498046875, -0.16567611694335938, -0.15386962890625, -0.14206314086914062, -0.13025665283203125, -0.11845016479492188, -0.1066436767578125, -0.09483718872070312, -0.08303070068359375, -0.07122421264648438, -0.059417724609375, -0.047611236572265625, -0.03580474853515625, -0.023998260498046875, -0.0121917724609375, -0.000385284423828125, 0.01142120361328125, 0.023227691650390625, 0.0350341796875, 0.046840667724609375, 0.05864715576171875, 0.07045364379882812, 0.0822601318359375, 0.09406661987304688, 0.10587310791015625, 0.11767959594726562, 0.129486083984375, 0.14129257202148438, 0.15309906005859375, 0.16490554809570312, 0.1767120361328125, 0.18851852416992188, 0.20032501220703125, 0.21213150024414062, 0.22393798828125, 0.23574447631835938, 0.24755096435546875, 0.2593574523925781, 0.2711639404296875, 0.2829704284667969, 0.29477691650390625, 0.3065834045410156, 0.318389892578125, 0.3301963806152344, 0.34200286865234375, 0.3538093566894531, 0.3656158447265625, 0.3774223327636719, 0.38922882080078125, 0.4010353088378906, 0.412841796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 9.0, 8.0, 9.0, 13.0, 8.0, 14.0, 21.0, 22.0, 24.0, 40.0, 47.0, 72.0, 71.0, 101.0, 186.0, 293.0, 640.0, 2464.0, 12850.0, 288745.0, 719392.0, 18643.0, 3107.0, 758.0, 309.0, 165.0, 121.0, 92.0, 57.0, 56.0, 43.0, 30.0, 25.0, 21.0, 22.0, 12.0, 12.0, 9.0, 5.0, 9.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.25, -1.2084503173828125, -1.166900634765625, -1.1253509521484375, -1.08380126953125, -1.0422515869140625, -1.000701904296875, -0.9591522216796875, -0.9176025390625, -0.8760528564453125, -0.834503173828125, -0.7929534912109375, -0.75140380859375, -0.7098541259765625, -0.668304443359375, -0.6267547607421875, -0.585205078125, -0.5436553955078125, -0.502105712890625, -0.4605560302734375, -0.41900634765625, -0.3774566650390625, -0.335906982421875, -0.2943572998046875, -0.2528076171875, -0.2112579345703125, -0.169708251953125, -0.1281585693359375, -0.08660888671875, -0.0450592041015625, -0.003509521484375, 0.0380401611328125, 0.07958984375, 0.1211395263671875, 0.162689208984375, 0.2042388916015625, 0.24578857421875, 0.2873382568359375, 0.328887939453125, 0.3704376220703125, 0.4119873046875, 0.4535369873046875, 0.495086669921875, 0.5366363525390625, 0.57818603515625, 0.6197357177734375, 0.661285400390625, 0.7028350830078125, 0.744384765625, 0.7859344482421875, 0.827484130859375, 0.8690338134765625, 0.91058349609375, 0.9521331787109375, 0.993682861328125, 1.0352325439453125, 1.0767822265625, 1.1183319091796875, 1.159881591796875, 1.2014312744140625, 1.24298095703125, 1.2845306396484375, 1.326080322265625, 1.3676300048828125, 1.4091796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 9.0, 8.0, 8.0, 13.0, 7.0, 13.0, 20.0, 19.0, 16.0, 21.0, 22.0, 29.0, 22.0, 27.0, 50.0, 40.0, 44.0, 43.0, 40.0, 44.0, 34.0, 30.0, 31.0, 37.0, 36.0, 39.0, 38.0, 36.0, 24.0, 25.0, 29.0, 21.0, 16.0, 17.0, 19.0, 11.0, 12.0, 9.0, 5.0, 8.0, 11.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2958984375, -1.2528228759765625, -1.209747314453125, -1.1666717529296875, -1.12359619140625, -1.0805206298828125, -1.037445068359375, -0.9943695068359375, -0.9512939453125, -0.9082183837890625, -0.865142822265625, -0.8220672607421875, -0.77899169921875, -0.7359161376953125, -0.692840576171875, -0.6497650146484375, -0.606689453125, -0.5636138916015625, -0.520538330078125, -0.4774627685546875, -0.43438720703125, -0.3913116455078125, -0.348236083984375, -0.3051605224609375, -0.2620849609375, -0.2190093994140625, -0.175933837890625, -0.1328582763671875, -0.08978271484375, -0.0467071533203125, -0.003631591796875, 0.0394439697265625, 0.08251953125, 0.1255950927734375, 0.168670654296875, 0.2117462158203125, 0.25482177734375, 0.2978973388671875, 0.340972900390625, 0.3840484619140625, 0.4271240234375, 0.4701995849609375, 0.513275146484375, 0.5563507080078125, 0.59942626953125, 0.6425018310546875, 0.685577392578125, 0.7286529541015625, 0.771728515625, 0.8148040771484375, 0.857879638671875, 0.9009552001953125, 0.94403076171875, 0.9871063232421875, 1.030181884765625, 1.0732574462890625, 1.1163330078125, 1.1594085693359375, 1.202484130859375, 1.2455596923828125, 1.28863525390625, 1.3317108154296875, 1.374786376953125, 1.4178619384765625, 1.4609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 5.0, 3.0, 5.0, 4.0, 11.0, 15.0, 14.0, 21.0, 30.0, 59.0, 102.0, 193.0, 460.0, 1275.0, 5076.0, 47943.0, 957935.0, 29668.0, 3871.0, 1049.0, 408.0, 173.0, 102.0, 44.0, 38.0, 13.0, 12.0, 13.0, 5.0, 8.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005049705505371094, -0.00048428773880004883, -0.0004636049270629883, -0.00044292211532592773, -0.0004222393035888672, -0.00040155649185180664, -0.0003808736801147461, -0.00036019086837768555, -0.000339508056640625, -0.00031882524490356445, -0.0002981424331665039, -0.00027745962142944336, -0.0002567768096923828, -0.00023609399795532227, -0.00021541118621826172, -0.00019472837448120117, -0.00017404556274414062, -0.00015336275100708008, -0.00013267993927001953, -0.00011199712753295898, -9.131431579589844e-05, -7.063150405883789e-05, -4.9948692321777344e-05, -2.9265880584716797e-05, -8.58306884765625e-06, 1.2099742889404297e-05, 3.2782554626464844e-05, 5.346536636352539e-05, 7.414817810058594e-05, 9.483098983764648e-05, 0.00011551380157470703, 0.00013619661331176758, 0.00015687942504882812, 0.00017756223678588867, 0.00019824504852294922, 0.00021892786026000977, 0.0002396106719970703, 0.00026029348373413086, 0.0002809762954711914, 0.00030165910720825195, 0.0003223419189453125, 0.00034302473068237305, 0.0003637075424194336, 0.00038439035415649414, 0.0004050731658935547, 0.00042575597763061523, 0.0004464387893676758, 0.00046712160110473633, 0.0004878044128417969, 0.0005084872245788574, 0.000529170036315918, 0.0005498528480529785, 0.0005705356597900391, 0.0005912184715270996, 0.0006119012832641602, 0.0006325840950012207, 0.0006532669067382812, 0.0006739497184753418, 0.0006946325302124023, 0.0007153153419494629, 0.0007359981536865234, 0.000756680965423584, 0.0007773637771606445, 0.0007980465888977051, 0.0008187294006347656]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 7.0, 2.0, 5.0, 1.0, 13.0, 8.0, 7.0, 28.0, 14.0, 32.0, 22.0, 54.0, 23.0, 53.0, 30.0, 34.0, 60.0, 32.0, 60.0, 41.0, 82.0, 20.0, 39.0, 58.0, 32.0, 49.0, 22.0, 38.0, 17.0, 39.0, 15.0, 11.0, 19.0, 5.0, 13.0, 5.0, 11.0, 2.0, 0.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4437904357910156e-06, -2.3581087589263916e-06, -2.2724270820617676e-06, -2.1867454051971436e-06, -2.1010637283325195e-06, -2.0153820514678955e-06, -1.9297003746032715e-06, -1.8440186977386475e-06, -1.7583370208740234e-06, -1.6726553440093994e-06, -1.5869736671447754e-06, -1.5012919902801514e-06, -1.4156103134155273e-06, -1.3299286365509033e-06, -1.2442469596862793e-06, -1.1585652828216553e-06, -1.0728836059570312e-06, -9.872019290924072e-07, -9.015202522277832e-07, -8.158385753631592e-07, -7.301568984985352e-07, -6.444752216339111e-07, -5.587935447692871e-07, -4.731118679046631e-07, -3.8743019104003906e-07, -3.0174851417541504e-07, -2.1606683731079102e-07, -1.30385160446167e-07, -4.470348358154297e-08, 4.0978193283081055e-08, 1.2665987014770508e-07, 2.123415470123291e-07, 2.980232238769531e-07, 3.8370490074157715e-07, 4.6938657760620117e-07, 5.550682544708252e-07, 6.407499313354492e-07, 7.264316082000732e-07, 8.121132850646973e-07, 8.977949619293213e-07, 9.834766387939453e-07, 1.0691583156585693e-06, 1.1548399925231934e-06, 1.2405216693878174e-06, 1.3262033462524414e-06, 1.4118850231170654e-06, 1.4975666999816895e-06, 1.5832483768463135e-06, 1.6689300537109375e-06, 1.7546117305755615e-06, 1.8402934074401855e-06, 1.9259750843048096e-06, 2.0116567611694336e-06, 2.0973384380340576e-06, 2.1830201148986816e-06, 2.2687017917633057e-06, 2.3543834686279297e-06, 2.4400651454925537e-06, 2.5257468223571777e-06, 2.6114284992218018e-06, 2.6971101760864258e-06, 2.78279185295105e-06, 2.868473529815674e-06, 2.954155206680298e-06, 3.039836883544922e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 7.0, 3.0, 8.0, 7.0, 10.0, 7.0, 10.0, 18.0, 35.0, 37.0, 53.0, 69.0, 131.0, 264.0, 563.0, 2217.0, 18263.0, 965580.0, 55843.0, 3816.0, 851.0, 292.0, 153.0, 78.0, 50.0, 45.0, 37.0, 28.0, 17.0, 12.0, 10.0, 8.0, 6.0, 8.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00039505958557128906, -0.0003817416727542877, -0.0003684237599372864, -0.00035510584712028503, -0.0003417879343032837, -0.00032847002148628235, -0.000315152108669281, -0.00030183419585227966, -0.0002885162830352783, -0.000275198370218277, -0.00026188045740127563, -0.0002485625445842743, -0.00023524463176727295, -0.0002219267189502716, -0.00020860880613327026, -0.00019529089331626892, -0.00018197298049926758, -0.00016865506768226624, -0.0001553371548652649, -0.00014201924204826355, -0.0001287013292312622, -0.00011538341641426086, -0.00010206550359725952, -8.874759078025818e-05, -7.542967796325684e-05, -6.211176514625549e-05, -4.879385232925415e-05, -3.547593951225281e-05, -2.2158026695251465e-05, -8.840113878250122e-06, 4.477798938751221e-06, 1.7795711755752563e-05, 3.1113624572753906e-05, 4.443153738975525e-05, 5.774945020675659e-05, 7.106736302375793e-05, 8.438527584075928e-05, 9.770318865776062e-05, 0.00011102110147476196, 0.0001243390142917633, 0.00013765692710876465, 0.000150974839925766, 0.00016429275274276733, 0.00017761066555976868, 0.00019092857837677002, 0.00020424649119377136, 0.0002175644040107727, 0.00023088231682777405, 0.0002442002296447754, 0.00025751814246177673, 0.0002708360552787781, 0.0002841539680957794, 0.00029747188091278076, 0.0003107897937297821, 0.00032410770654678345, 0.0003374256193637848, 0.00035074353218078613, 0.0003640614449977875, 0.0003773793578147888, 0.00039069727063179016, 0.0004040151834487915, 0.00041733309626579285, 0.0004306510090827942, 0.00044396892189979553, 0.0004572868347167969]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 4.0, 3.0, 4.0, 7.0, 8.0, 5.0, 6.0, 14.0, 20.0, 19.0, 24.0, 29.0, 43.0, 49.0, 55.0, 65.0, 76.0, 77.0, 75.0, 70.0, 67.0, 49.0, 44.0, 36.0, 21.0, 23.0, 25.0, 16.0, 13.0, 9.0, 6.0, 9.0, 5.0, 8.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0004096031188964844, -0.0003957971930503845, -0.00038199126720428467, -0.0003681853413581848, -0.00035437941551208496, -0.0003405734896659851, -0.00032676756381988525, -0.0003129616379737854, -0.00029915571212768555, -0.0002853497862815857, -0.00027154386043548584, -0.000257737934589386, -0.00024393200874328613, -0.00023012608289718628, -0.00021632015705108643, -0.00020251423120498657, -0.00018870830535888672, -0.00017490237951278687, -0.000161096453666687, -0.00014729052782058716, -0.0001334846019744873, -0.00011967867612838745, -0.0001058727502822876, -9.206682443618774e-05, -7.826089859008789e-05, -6.445497274398804e-05, -5.0649046897888184e-05, -3.684312105178833e-05, -2.3037195205688477e-05, -9.231269359588623e-06, 4.5746564865112305e-06, 1.8380582332611084e-05, 3.218650817871094e-05, 4.599243402481079e-05, 5.9798359870910645e-05, 7.36042857170105e-05, 8.741021156311035e-05, 0.0001012161374092102, 0.00011502206325531006, 0.0001288279891014099, 0.00014263391494750977, 0.00015643984079360962, 0.00017024576663970947, 0.00018405169248580933, 0.00019785761833190918, 0.00021166354417800903, 0.0002254694700241089, 0.00023927539587020874, 0.0002530813217163086, 0.00026688724756240845, 0.0002806931734085083, 0.00029449909925460815, 0.000308305025100708, 0.00032211095094680786, 0.0003359168767929077, 0.00034972280263900757, 0.0003635287284851074, 0.0003773346543312073, 0.00039114058017730713, 0.000404946506023407, 0.00041875243186950684, 0.0004325583577156067, 0.00044636428356170654, 0.0004601702094078064, 0.00047397613525390625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 9.0, 33.0, 928.0, 40.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.613487243652344, -13.671551704406738, -12.729616165161133, -11.787681579589844, -10.845746040344238, -9.903810501098633, -8.961875915527344, -8.019940376281738, -7.078004837036133, -6.136069297790527, -5.19413423538208, -4.252199172973633, -3.3102636337280273, -2.368328094482422, -1.4263930320739746, -0.48445796966552734, 0.4574775695800781, 1.3994128704071045, 2.341348171234131, 3.2832834720611572, 4.225218772888184, 5.167154312133789, 6.109089374542236, 7.051024436950684, 7.992959976196289, 8.934895515441895, 9.8768310546875, 10.818765640258789, 11.760701179504395, 12.70263671875, 13.644571304321289, 14.586506843566895, 15.5284423828125, 16.47037696838379, 17.41231346130371, 18.354248046875, 19.296184539794922, 20.23811912536621, 21.1800537109375, 22.121990203857422, 23.06392478942871, 24.005859375, 24.947795867919922, 25.88973045349121, 26.8316650390625, 27.773601531982422, 28.71553611755371, 29.657470703125, 30.599407196044922, 31.54134178161621, 32.4832763671875, 33.42521286010742, 34.367149353027344, 35.30908203125, 36.25101852416992, 37.192955017089844, 38.1348876953125, 39.07682418823242, 40.01875686645508, 40.960693359375, 41.90262985229492, 42.844566345214844, 43.7864990234375, 44.72843551635742, 45.670372009277344]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 7.0, 3.0, 14.0, 20.0, 13.0, 25.0, 44.0, 73.0, 112.0, 156.0, 155.0, 127.0, 95.0, 47.0, 24.0, 16.0, 6.0, 10.0, 9.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.740238189697266, -33.80185317993164, -32.863468170166016, -31.925081253051758, -30.986696243286133, -30.048309326171875, -29.10992431640625, -28.171539306640625, -27.233154296875, -26.294769287109375, -25.356382369995117, -24.417997360229492, -23.479612350463867, -22.54122543334961, -21.602840423583984, -20.66445541381836, -19.7260684967041, -18.787683486938477, -17.84929656982422, -16.910911560058594, -15.972526550292969, -15.034140586853027, -14.095754623413086, -13.157369613647461, -12.21898365020752, -11.280597686767578, -10.342212677001953, -9.403826713562012, -8.46544075012207, -7.527055740356445, -6.588669776916504, -5.650284290313721, -4.7118988037109375, -3.7735133171081543, -2.835127592086792, -1.8967418670654297, -0.9583563804626465, -0.01997089385986328, 0.9184150695800781, 1.8568005561828613, 2.7951860427856445, 3.7335715293884277, 4.671957015991211, 5.610342979431152, 6.5487284660339355, 7.487113952636719, 8.42549991607666, 9.363885879516602, 10.302270889282227, 11.240656852722168, 12.179041862487793, 13.117427825927734, 14.05581283569336, 14.9941987991333, 15.932584762573242, 16.870969772338867, 17.809356689453125, 18.74774169921875, 19.686128616333008, 20.624513626098633, 21.562898635864258, 22.501285552978516, 23.43967056274414, 24.378055572509766, 25.31644058227539]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 13.0, 15.0, 25.0, 44.0, 128.0, 349.0, 963.0, 4875.0, 4168870.0, 14463.0, 2985.0, 917.0, 334.0, 119.0, 45.0, 31.0, 13.0, 13.0, 13.0, 9.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.1796875, -5.010986328125, -4.84228515625, -4.673583984375, -4.5048828125, -4.336181640625, -4.16748046875, -3.998779296875, -3.830078125, -3.661376953125, -3.49267578125, -3.323974609375, -3.1552734375, -2.986572265625, -2.81787109375, -2.649169921875, -2.48046875, -2.311767578125, -2.14306640625, -1.974365234375, -1.8056640625, -1.636962890625, -1.46826171875, -1.299560546875, -1.130859375, -0.962158203125, -0.79345703125, -0.624755859375, -0.4560546875, -0.287353515625, -0.11865234375, 0.050048828125, 0.21875, 0.387451171875, 0.55615234375, 0.724853515625, 0.8935546875, 1.062255859375, 1.23095703125, 1.399658203125, 1.568359375, 1.737060546875, 1.90576171875, 2.074462890625, 2.2431640625, 2.411865234375, 2.58056640625, 2.749267578125, 2.91796875, 3.086669921875, 3.25537109375, 3.424072265625, 3.5927734375, 3.761474609375, 3.93017578125, 4.098876953125, 4.267578125, 4.436279296875, 4.60498046875, 4.773681640625, 4.9423828125, 5.111083984375, 5.27978515625, 5.448486328125, 5.6171875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 5.0, 9.0, 7.0, 12.0, 12.0, 18.0, 96.0, 689.0, 31.0, 17.0, 8.0, 8.0, 10.0, 5.0, 4.0, 3.0, 3.0, 4.0, 8.0, 6.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2802734375, -0.2711448669433594, -0.26201629638671875, -0.2528877258300781, -0.2437591552734375, -0.23463058471679688, -0.22550201416015625, -0.21637344360351562, -0.207244873046875, -0.19811630249023438, -0.18898773193359375, -0.17985916137695312, -0.1707305908203125, -0.16160202026367188, -0.15247344970703125, -0.14334487915039062, -0.13421630859375, -0.12508773803710938, -0.11595916748046875, -0.10683059692382812, -0.0977020263671875, -0.08857345581054688, -0.07944488525390625, -0.07031631469726562, -0.061187744140625, -0.052059173583984375, -0.04293060302734375, -0.033802032470703125, -0.0246734619140625, -0.015544891357421875, -0.00641632080078125, 0.002712249755859375, 0.0118408203125, 0.020969390869140625, 0.03009796142578125, 0.039226531982421875, 0.0483551025390625, 0.057483673095703125, 0.06661224365234375, 0.07574081420898438, 0.084869384765625, 0.09399795532226562, 0.10312652587890625, 0.11225509643554688, 0.1213836669921875, 0.13051223754882812, 0.13964080810546875, 0.14876937866210938, 0.15789794921875, 0.16702651977539062, 0.17615509033203125, 0.18528366088867188, 0.1944122314453125, 0.20354080200195312, 0.21266937255859375, 0.22179794311523438, 0.230926513671875, 0.24005508422851562, 0.24918365478515625, 0.2583122253417969, 0.2674407958984375, 0.2765693664550781, 0.28569793701171875, 0.2948265075683594, 0.303955078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 3.0, 5.0, 10.0, 6.0, 15.0, 6.0, 11.0, 22.0, 28.0, 41.0, 38.0, 68.0, 169.0, 386.0, 1609.0, 15011.0, 4141457.0, 31756.0, 2558.0, 558.0, 206.0, 86.0, 74.0, 36.0, 19.0, 24.0, 22.0, 19.0, 11.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.84375, -3.70941162109375, -3.5750732421875, -3.44073486328125, -3.306396484375, -3.17205810546875, -3.0377197265625, -2.90338134765625, -2.76904296875, -2.63470458984375, -2.5003662109375, -2.36602783203125, -2.231689453125, -2.09735107421875, -1.9630126953125, -1.82867431640625, -1.6943359375, -1.55999755859375, -1.4256591796875, -1.29132080078125, -1.156982421875, -1.02264404296875, -0.8883056640625, -0.75396728515625, -0.61962890625, -0.48529052734375, -0.3509521484375, -0.21661376953125, -0.082275390625, 0.05206298828125, 0.1864013671875, 0.32073974609375, 0.455078125, 0.58941650390625, 0.7237548828125, 0.85809326171875, 0.992431640625, 1.12677001953125, 1.2611083984375, 1.39544677734375, 1.52978515625, 1.66412353515625, 1.7984619140625, 1.93280029296875, 2.067138671875, 2.20147705078125, 2.3358154296875, 2.47015380859375, 2.6044921875, 2.73883056640625, 2.8731689453125, 3.00750732421875, 3.141845703125, 3.27618408203125, 3.4105224609375, 3.54486083984375, 3.67919921875, 3.81353759765625, 3.9478759765625, 4.08221435546875, 4.216552734375, 4.35089111328125, 4.4852294921875, 4.61956787109375, 4.75390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 11.0, 1.0, 4.0, 7.0, 16.0, 7.0, 12.0, 9.0, 17.0, 21.0, 24.0, 29.0, 272.0, 3419.0, 30.0, 28.0, 21.0, 21.0, 17.0, 20.0, 9.0, 12.0, 20.0, 2.0, 12.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51318359375, -0.49417877197265625, -0.4751739501953125, -0.45616912841796875, -0.437164306640625, -0.41815948486328125, -0.3991546630859375, -0.38014984130859375, -0.36114501953125, -0.34214019775390625, -0.3231353759765625, -0.30413055419921875, -0.285125732421875, -0.26612091064453125, -0.2471160888671875, -0.22811126708984375, -0.2091064453125, -0.19010162353515625, -0.1710968017578125, -0.15209197998046875, -0.133087158203125, -0.11408233642578125, -0.0950775146484375, -0.07607269287109375, -0.05706787109375, -0.03806304931640625, -0.0190582275390625, -5.340576171875e-05, 0.018951416015625, 0.03795623779296875, 0.0569610595703125, 0.07596588134765625, 0.094970703125, 0.11397552490234375, 0.1329803466796875, 0.15198516845703125, 0.170989990234375, 0.18999481201171875, 0.2089996337890625, 0.22800445556640625, 0.24700927734375, 0.26601409912109375, 0.2850189208984375, 0.30402374267578125, 0.323028564453125, 0.34203338623046875, 0.3610382080078125, 0.38004302978515625, 0.3990478515625, 0.41805267333984375, 0.4370574951171875, 0.45606231689453125, 0.475067138671875, 0.49407196044921875, 0.5130767822265625, 0.5320816040039062, 0.55108642578125, 0.5700912475585938, 0.5890960693359375, 0.6081008911132812, 0.627105712890625, 0.6461105346679688, 0.6651153564453125, 0.6841201782226562, 0.703125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 7.0, 21.0, 898.0, 81.0, 7.0, 2.0, 0.0, 1.0], "bins": [-7.451050281524658, -7.324421405792236, -7.197792053222656, -7.071163177490234, -6.944533824920654, -6.817904949188232, -6.691275596618652, -6.5646467208862305, -6.438017845153809, -6.311388969421387, -6.184759616851807, -6.058130741119385, -5.931501388549805, -5.804872512817383, -5.678243637084961, -5.551614284515381, -5.424984931945801, -5.298356056213379, -5.171726703643799, -5.045097827911377, -4.918468475341797, -4.791839599609375, -4.665210723876953, -4.538581371307373, -4.411952495574951, -4.285323619842529, -4.158694267272949, -4.032065391540527, -3.9054362773895264, -3.7788071632385254, -3.6521780490875244, -3.5255489349365234, -3.3989200592041016, -3.2722909450531006, -3.1456618309020996, -3.0190329551696777, -2.8924038410186768, -2.765774726867676, -2.639145612716675, -2.512516498565674, -2.385887622833252, -2.259258508682251, -2.13262939453125, -2.006000518798828, -1.8793714046478271, -1.7527422904968262, -1.6261131763458252, -1.4994840621948242, -1.3728550672531128, -1.2462259531021118, -1.1195969581604004, -0.9929678440093994, -0.8663387894630432, -0.739709734916687, -0.613080620765686, -0.48645156621932983, -0.35982251167297363, -0.23319344222545624, -0.10656437277793884, 0.020064711570739746, 0.14669376611709595, 0.27332282066345215, 0.3999519348144531, 0.5265809893608093, 0.6532100439071655]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 3.0, 10.0, 7.0, 19.0, 12.0, 31.0, 68.0, 95.0, 123.0, 146.0, 148.0, 110.0, 73.0, 38.0, 28.0, 20.0, 6.0, 5.0, 6.0, 2.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.8338849544525146, -2.7452285289764404, -2.656571865081787, -2.567915439605713, -2.4792590141296387, -2.3906023502349854, -2.301945924758911, -2.213289260864258, -2.1246328353881836, -2.0359764099121094, -1.947319746017456, -1.8586633205413818, -1.770006775856018, -1.6813502311706543, -1.59269380569458, -1.5040372610092163, -1.4153807163238525, -1.3267241716384888, -1.238067626953125, -1.1494112014770508, -1.060754656791687, -0.9720981121063232, -0.8834416270256042, -0.7947851419448853, -0.7061285972595215, -0.6174720525741577, -0.5288155674934387, -0.44015905261039734, -0.35150253772735596, -0.2628460228443146, -0.1741895079612732, -0.0855330228805542, 0.0031232833862304688, 0.09177979826927185, 0.18043631315231323, 0.2690928280353546, 0.357749342918396, 0.4464058578014374, 0.5350623726844788, 0.6237188577651978, 0.7123754024505615, 0.8010319471359253, 0.8896884322166443, 0.9783449172973633, 1.067001461982727, 1.1556580066680908, 1.244314432144165, 1.3329709768295288, 1.4216275215148926, 1.5102840662002563, 1.5989406108856201, 1.6875970363616943, 1.776253581047058, 1.8649101257324219, 1.953566551208496, 2.0422229766845703, 2.1308796405792236, 2.219536066055298, 2.308192729949951, 2.3968491554260254, 2.4855055809020996, 2.574162244796753, 2.662818670272827, 2.7514753341674805, 2.8401317596435547]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 9.0, 11.0, 12.0, 8.0, 22.0, 28.0, 28.0, 35.0, 64.0, 62.0, 102.0, 140.0, 195.0, 249.0, 361.0, 512.0, 701.0, 933.0, 1342.0, 1871.0, 2747.0, 4237.0, 6577.0, 11275.0, 23012.0, 556784.0, 384067.0, 22478.0, 11090.0, 6382.0, 3990.0, 2722.0, 1821.0, 1320.0, 934.0, 679.0, 474.0, 378.0, 214.0, 204.0, 137.0, 87.0, 65.0, 54.0, 26.0, 26.0, 29.0, 18.0, 8.0, 6.0, 11.0, 6.0, 2.0, 5.0, 3.0, 2.0, 3.0], "bins": [-0.884765625, -0.857940673828125, -0.83111572265625, -0.804290771484375, -0.7774658203125, -0.750640869140625, -0.72381591796875, -0.696990966796875, -0.670166015625, -0.643341064453125, -0.61651611328125, -0.589691162109375, -0.5628662109375, -0.536041259765625, -0.50921630859375, -0.482391357421875, -0.45556640625, -0.428741455078125, -0.40191650390625, -0.375091552734375, -0.3482666015625, -0.321441650390625, -0.29461669921875, -0.267791748046875, -0.240966796875, -0.214141845703125, -0.18731689453125, -0.160491943359375, -0.1336669921875, -0.106842041015625, -0.08001708984375, -0.053192138671875, -0.0263671875, 0.000457763671875, 0.02728271484375, 0.054107666015625, 0.0809326171875, 0.107757568359375, 0.13458251953125, 0.161407470703125, 0.188232421875, 0.215057373046875, 0.24188232421875, 0.268707275390625, 0.2955322265625, 0.322357177734375, 0.34918212890625, 0.376007080078125, 0.40283203125, 0.429656982421875, 0.45648193359375, 0.483306884765625, 0.5101318359375, 0.536956787109375, 0.56378173828125, 0.590606689453125, 0.617431640625, 0.644256591796875, 0.67108154296875, 0.697906494140625, 0.7247314453125, 0.751556396484375, 0.77838134765625, 0.805206298828125, 0.83203125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 8.0, 8.0, 5.0, 11.0, 11.0, 10.0, 14.0, 83.0, 647.0, 76.0, 15.0, 13.0, 13.0, 7.0, 8.0, 4.0, 3.0, 5.0, 3.0, 6.0, 4.0, 3.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.252685546875, -0.2445068359375, -0.236328125, -0.2281494140625, -0.219970703125, -0.2117919921875, -0.20361328125, -0.1954345703125, -0.187255859375, -0.1790771484375, -0.1708984375, -0.1627197265625, -0.154541015625, -0.1463623046875, -0.13818359375, -0.1300048828125, -0.121826171875, -0.1136474609375, -0.10546875, -0.0972900390625, -0.089111328125, -0.0809326171875, -0.07275390625, -0.0645751953125, -0.056396484375, -0.0482177734375, -0.0400390625, -0.0318603515625, -0.023681640625, -0.0155029296875, -0.00732421875, 0.0008544921875, 0.009033203125, 0.0172119140625, 0.025390625, 0.0335693359375, 0.041748046875, 0.0499267578125, 0.05810546875, 0.0662841796875, 0.074462890625, 0.0826416015625, 0.0908203125, 0.0989990234375, 0.107177734375, 0.1153564453125, 0.12353515625, 0.1317138671875, 0.139892578125, 0.1480712890625, 0.15625, 0.1644287109375, 0.172607421875, 0.1807861328125, 0.18896484375, 0.1971435546875, 0.205322265625, 0.2135009765625, 0.2216796875, 0.2298583984375, 0.238037109375, 0.2462158203125, 0.25439453125, 0.2625732421875, 0.270751953125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 8.0, 6.0, 12.0, 9.0, 14.0, 10.0, 28.0, 26.0, 31.0, 46.0, 44.0, 75.0, 81.0, 120.0, 167.0, 203.0, 339.0, 890.0, 9175.0, 973709.0, 60423.0, 1664.0, 472.0, 246.0, 164.0, 129.0, 96.0, 77.0, 71.0, 46.0, 44.0, 30.0, 21.0, 17.0, 8.0, 11.0, 9.0, 6.0, 5.0, 10.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.51171875, -2.4413604736328125, -2.371002197265625, -2.3006439208984375, -2.23028564453125, -2.1599273681640625, -2.089569091796875, -2.0192108154296875, -1.9488525390625, -1.8784942626953125, -1.808135986328125, -1.7377777099609375, -1.66741943359375, -1.5970611572265625, -1.526702880859375, -1.4563446044921875, -1.385986328125, -1.3156280517578125, -1.245269775390625, -1.1749114990234375, -1.10455322265625, -1.0341949462890625, -0.963836669921875, -0.8934783935546875, -0.8231201171875, -0.7527618408203125, -0.682403564453125, -0.6120452880859375, -0.54168701171875, -0.4713287353515625, -0.400970458984375, -0.3306121826171875, -0.26025390625, -0.1898956298828125, -0.119537353515625, -0.0491790771484375, 0.02117919921875, 0.0915374755859375, 0.161895751953125, 0.2322540283203125, 0.3026123046875, 0.3729705810546875, 0.443328857421875, 0.5136871337890625, 0.58404541015625, 0.6544036865234375, 0.724761962890625, 0.7951202392578125, 0.865478515625, 0.9358367919921875, 1.006195068359375, 1.0765533447265625, 1.14691162109375, 1.2172698974609375, 1.287628173828125, 1.3579864501953125, 1.4283447265625, 1.4987030029296875, 1.569061279296875, 1.6394195556640625, 1.70977783203125, 1.7801361083984375, 1.850494384765625, 1.9208526611328125, 1.9912109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 8.0, 6.0, 9.0, 7.0, 13.0, 7.0, 22.0, 10.0, 19.0, 28.0, 24.0, 30.0, 30.0, 35.0, 43.0, 38.0, 34.0, 39.0, 44.0, 47.0, 49.0, 44.0, 50.0, 36.0, 32.0, 39.0, 40.0, 30.0, 36.0, 24.0, 28.0, 18.0, 15.0, 14.0, 6.0, 9.0, 8.0, 6.0, 5.0, 10.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.015625, -0.9871826171875, -0.958740234375, -0.9302978515625, -0.90185546875, -0.8734130859375, -0.844970703125, -0.8165283203125, -0.7880859375, -0.7596435546875, -0.731201171875, -0.7027587890625, -0.67431640625, -0.6458740234375, -0.617431640625, -0.5889892578125, -0.560546875, -0.5321044921875, -0.503662109375, -0.4752197265625, -0.44677734375, -0.4183349609375, -0.389892578125, -0.3614501953125, -0.3330078125, -0.3045654296875, -0.276123046875, -0.2476806640625, -0.21923828125, -0.1907958984375, -0.162353515625, -0.1339111328125, -0.10546875, -0.0770263671875, -0.048583984375, -0.0201416015625, 0.00830078125, 0.0367431640625, 0.065185546875, 0.0936279296875, 0.1220703125, 0.1505126953125, 0.178955078125, 0.2073974609375, 0.23583984375, 0.2642822265625, 0.292724609375, 0.3211669921875, 0.349609375, 0.3780517578125, 0.406494140625, 0.4349365234375, 0.46337890625, 0.4918212890625, 0.520263671875, 0.5487060546875, 0.5771484375, 0.6055908203125, 0.634033203125, 0.6624755859375, 0.69091796875, 0.7193603515625, 0.747802734375, 0.7762451171875, 0.8046875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 5.0, 8.0, 11.0, 6.0, 25.0, 51.0, 61.0, 147.0, 239.0, 599.0, 1845.0, 12487.0, 997916.0, 30876.0, 2807.0, 785.0, 331.0, 154.0, 77.0, 41.0, 26.0, 20.0, 6.0, 9.0, 2.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0025119781494140625, -0.002437293529510498, -0.0023626089096069336, -0.002287924289703369, -0.0022132396697998047, -0.0021385550498962402, -0.0020638704299926758, -0.0019891858100891113, -0.0019145011901855469, -0.0018398165702819824, -0.001765131950378418, -0.0016904473304748535, -0.001615762710571289, -0.0015410780906677246, -0.0014663934707641602, -0.0013917088508605957, -0.0013170242309570312, -0.0012423396110534668, -0.0011676549911499023, -0.0010929703712463379, -0.0010182857513427734, -0.000943601131439209, -0.0008689165115356445, -0.0007942318916320801, -0.0007195472717285156, -0.0006448626518249512, -0.0005701780319213867, -0.0004954934120178223, -0.0004208087921142578, -0.00034612417221069336, -0.0002714395523071289, -0.00019675493240356445, -0.0001220703125, -4.738569259643555e-05, 2.7298927307128906e-05, 0.00010198354721069336, 0.0001766681671142578, 0.00025135278701782227, 0.0003260374069213867, 0.00040072202682495117, 0.0004754066467285156, 0.0005500912666320801, 0.0006247758865356445, 0.000699460506439209, 0.0007741451263427734, 0.0008488297462463379, 0.0009235143661499023, 0.0009981989860534668, 0.0010728836059570312, 0.0011475682258605957, 0.0012222528457641602, 0.0012969374656677246, 0.001371622085571289, 0.0014463067054748535, 0.001520991325378418, 0.0015956759452819824, 0.0016703605651855469, 0.0017450451850891113, 0.0018197298049926758, 0.0018944144248962402, 0.0019690990447998047, 0.002043783664703369, 0.0021184682846069336, 0.002193152904510498, 0.0022678375244140625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 12.0, 16.0, 21.0, 37.0, 46.0, 49.0, 58.0, 38.0, 89.0, 97.0, 111.0, 84.0, 92.0, 68.0, 53.0, 41.0, 27.0, 16.0, 15.0, 15.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.185604095458984e-06, -5.013309419155121e-06, -4.841014742851257e-06, -4.668720066547394e-06, -4.49642539024353e-06, -4.324130713939667e-06, -4.151836037635803e-06, -3.97954136133194e-06, -3.807246685028076e-06, -3.6349520087242126e-06, -3.462657332420349e-06, -3.2903626561164856e-06, -3.118067979812622e-06, -2.9457733035087585e-06, -2.773478627204895e-06, -2.6011839509010315e-06, -2.428889274597168e-06, -2.2565945982933044e-06, -2.084299921989441e-06, -1.9120052456855774e-06, -1.7397105693817139e-06, -1.5674158930778503e-06, -1.3951212167739868e-06, -1.2228265404701233e-06, -1.0505318641662598e-06, -8.782371878623962e-07, -7.059425115585327e-07, -5.336478352546692e-07, -3.6135315895080566e-07, -1.8905848264694214e-07, -1.6763806343078613e-08, 1.555308699607849e-07, 3.2782554626464844e-07, 5.00120222568512e-07, 6.724148988723755e-07, 8.44709575176239e-07, 1.0170042514801025e-06, 1.189298927783966e-06, 1.3615936040878296e-06, 1.5338882803916931e-06, 1.7061829566955566e-06, 1.8784776329994202e-06, 2.0507723093032837e-06, 2.2230669856071472e-06, 2.3953616619110107e-06, 2.5676563382148743e-06, 2.739951014518738e-06, 2.9122456908226013e-06, 3.084540367126465e-06, 3.2568350434303284e-06, 3.429129719734192e-06, 3.6014243960380554e-06, 3.773719072341919e-06, 3.9460137486457825e-06, 4.118308424949646e-06, 4.2906031012535095e-06, 4.462897777557373e-06, 4.6351924538612366e-06, 4.8074871301651e-06, 4.979781806468964e-06, 5.152076482772827e-06, 5.324371159076691e-06, 5.496665835380554e-06, 5.668960511684418e-06, 5.841255187988281e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 6.0, 6.0, 7.0, 12.0, 16.0, 23.0, 25.0, 38.0, 53.0, 57.0, 108.0, 151.0, 204.0, 455.0, 2115.0, 828645.0, 213956.0, 1608.0, 382.0, 228.0, 120.0, 82.0, 73.0, 51.0, 40.0, 25.0, 12.0, 16.0, 10.0, 4.0, 7.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014581680297851562, -0.0014077872037887573, -0.0013574063777923584, -0.0013070255517959595, -0.0012566447257995605, -0.0012062638998031616, -0.0011558830738067627, -0.0011055022478103638, -0.0010551214218139648, -0.001004740595817566, -0.000954359769821167, -0.0009039789438247681, -0.0008535981178283691, -0.0008032172918319702, -0.0007528364658355713, -0.0007024556398391724, -0.0006520748138427734, -0.0006016939878463745, -0.0005513131618499756, -0.0005009323358535767, -0.00045055150985717773, -0.0004001706838607788, -0.0003497898578643799, -0.00029940903186798096, -0.00024902820587158203, -0.0001986473798751831, -0.00014826655387878418, -9.788572788238525e-05, -4.750490188598633e-05, 2.8759241104125977e-06, 5.3256750106811523e-05, 0.00010363757610321045, 0.00015401840209960938, 0.0002043992280960083, 0.0002547800540924072, 0.00030516088008880615, 0.0003555417060852051, 0.000405922532081604, 0.00045630335807800293, 0.0005066841840744019, 0.0005570650100708008, 0.0006074458360671997, 0.0006578266620635986, 0.0007082074880599976, 0.0007585883140563965, 0.0008089691400527954, 0.0008593499660491943, 0.0009097307920455933, 0.0009601116180419922, 0.0010104924440383911, 0.00106087327003479, 0.001111254096031189, 0.0011616349220275879, 0.0012120157480239868, 0.0012623965740203857, 0.0013127774000167847, 0.0013631582260131836, 0.0014135390520095825, 0.0014639198780059814, 0.0015143007040023804, 0.0015646815299987793, 0.0016150623559951782, 0.0016654431819915771, 0.001715824007987976, 0.001766204833984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 6.0, 4.0, 5.0, 8.0, 11.0, 19.0, 14.0, 23.0, 29.0, 30.0, 36.0, 52.0, 45.0, 75.0, 89.0, 81.0, 68.0, 79.0, 62.0, 51.0, 33.0, 28.0, 35.0, 25.0, 29.0, 15.0, 5.0, 13.0, 8.0, 3.0, 7.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005893707275390625, -0.0005690157413482666, -0.0005486607551574707, -0.0005283057689666748, -0.0005079507827758789, -0.000487595796585083, -0.0004672408103942871, -0.0004468858242034912, -0.0004265308380126953, -0.0004061758518218994, -0.0003858208656311035, -0.0003654658794403076, -0.0003451108932495117, -0.0003247559070587158, -0.0003044009208679199, -0.000284045934677124, -0.0002636909484863281, -0.00024333596229553223, -0.00022298097610473633, -0.00020262598991394043, -0.00018227100372314453, -0.00016191601753234863, -0.00014156103134155273, -0.00012120604515075684, -0.00010085105895996094, -8.049607276916504e-05, -6.014108657836914e-05, -3.978610038757324e-05, -1.9431114196777344e-05, 9.238719940185547e-07, 2.1278858184814453e-05, 4.163384437561035e-05, 6.198883056640625e-05, 8.234381675720215e-05, 0.00010269880294799805, 0.00012305378913879395, 0.00014340877532958984, 0.00016376376152038574, 0.00018411874771118164, 0.00020447373390197754, 0.00022482872009277344, 0.00024518370628356934, 0.00026553869247436523, 0.00028589367866516113, 0.00030624866485595703, 0.00032660365104675293, 0.00034695863723754883, 0.0003673136234283447, 0.0003876686096191406, 0.0004080235958099365, 0.0004283785820007324, 0.0004487335681915283, 0.0004690885543823242, 0.0004894435405731201, 0.000509798526763916, 0.0005301535129547119, 0.0005505084991455078, 0.0005708634853363037, 0.0005912184715270996, 0.0006115734577178955, 0.0006319284439086914, 0.0006522834300994873, 0.0006726384162902832, 0.0006929934024810791, 0.000713348388671875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 803.0, 215.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.245146751403809, -2.0955421924591064, 0.0540623664855957, 2.2036666870117188, 4.353271484375, 6.502876281738281, 8.652480125427246, 10.802084922790527, 12.951689720153809, 15.10129451751709, 17.250898361206055, 19.400503158569336, 21.550107955932617, 23.6997127532959, 25.849315643310547, 27.998920440673828, 30.14852523803711, 32.29813003540039, 34.44773483276367, 36.59733963012695, 38.746944427490234, 40.896549224853516, 43.04615020751953, 45.19575500488281, 47.34536361694336, 49.49496841430664, 51.64457321166992, 53.7941780090332, 55.943782806396484, 58.093387603759766, 60.24298858642578, 62.39259338378906, 64.54219818115234, 66.69180297851562, 68.8414077758789, 70.99101257324219, 73.14061737060547, 75.29022216796875, 77.43982696533203, 79.58943176269531, 81.7390365600586, 83.88864135742188, 86.03824615478516, 88.18785095214844, 90.33745574951172, 92.487060546875, 94.63666534423828, 96.78627014160156, 98.93586730957031, 101.0854721069336, 103.23507690429688, 105.38468170166016, 107.53428649902344, 109.68389129638672, 111.83349609375, 113.98310089111328, 116.13270568847656, 118.28231048583984, 120.43191528320312, 122.5815200805664, 124.73112487792969, 126.88072967529297, 129.03033447265625, 131.179931640625, 133.3295440673828]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 1.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 13.0, 13.0, 12.0, 22.0, 21.0, 39.0, 35.0, 57.0, 47.0, 64.0, 74.0, 75.0, 77.0, 87.0, 54.0, 47.0, 65.0, 44.0, 29.0, 25.0, 18.0, 15.0, 7.0, 5.0, 7.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.525471687316895, -8.257101058959961, -7.988729476928711, -7.720358371734619, -7.451987266540527, -7.1836161613464355, -6.915245056152344, -6.646873950958252, -6.37850284576416, -6.110131740570068, -5.841760635375977, -5.573389530181885, -5.305018424987793, -5.036647319793701, -4.768276214599609, -4.499905109405518, -4.231534004211426, -3.963162899017334, -3.694791793823242, -3.4264206886291504, -3.1580495834350586, -2.889678478240967, -2.621307373046875, -2.352936267852783, -2.0845651626586914, -1.8161940574645996, -1.5478229522705078, -1.279451847076416, -1.0110807418823242, -0.7427096366882324, -0.4743385314941406, -0.20596742630004883, 0.062404632568359375, 0.33077573776245117, 0.599146842956543, 0.8675179481506348, 1.1358890533447266, 1.4042601585388184, 1.6726312637329102, 1.941002368927002, 2.2093734741210938, 2.4777445793151855, 2.7461156845092773, 3.014486789703369, 3.282857894897461, 3.5512290000915527, 3.8196001052856445, 4.087971210479736, 4.356342315673828, 4.62471342086792, 4.893084526062012, 5.1614556312561035, 5.429826736450195, 5.698197841644287, 5.966568946838379, 6.234940052032471, 6.5033111572265625, 6.771682262420654, 7.040053367614746, 7.308424472808838, 7.57679557800293, 7.8451666831970215, 8.113537788391113, 8.381908416748047, 8.650279998779297]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 14.0, 12.0, 14.0, 31.0, 51.0, 73.0, 109.0, 174.0, 311.0, 541.0, 1043.0, 2322.0, 6217.0, 48993.0, 4110331.0, 13287.0, 5078.0, 2473.0, 1283.0, 732.0, 431.0, 250.0, 163.0, 101.0, 75.0, 37.0, 37.0, 27.0, 11.0, 11.0, 9.0, 6.0, 2.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.291015625, -2.217681884765625, -2.14434814453125, -2.071014404296875, -1.9976806640625, -1.924346923828125, -1.85101318359375, -1.777679443359375, -1.704345703125, -1.631011962890625, -1.55767822265625, -1.484344482421875, -1.4110107421875, -1.337677001953125, -1.26434326171875, -1.191009521484375, -1.11767578125, -1.044342041015625, -0.97100830078125, -0.897674560546875, -0.8243408203125, -0.751007080078125, -0.67767333984375, -0.604339599609375, -0.531005859375, -0.457672119140625, -0.38433837890625, -0.311004638671875, -0.2376708984375, -0.164337158203125, -0.09100341796875, -0.017669677734375, 0.0556640625, 0.128997802734375, 0.20233154296875, 0.275665283203125, 0.3489990234375, 0.422332763671875, 0.49566650390625, 0.569000244140625, 0.642333984375, 0.715667724609375, 0.78900146484375, 0.862335205078125, 0.9356689453125, 1.009002685546875, 1.08233642578125, 1.155670166015625, 1.22900390625, 1.302337646484375, 1.37567138671875, 1.449005126953125, 1.5223388671875, 1.595672607421875, 1.66900634765625, 1.742340087890625, 1.815673828125, 1.889007568359375, 1.96234130859375, 2.035675048828125, 2.1090087890625, 2.182342529296875, 2.25567626953125, 2.329010009765625, 2.40234375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 8.0, 4.0, 10.0, 5.0, 7.0, 10.0, 10.0, 12.0, 41.0, 470.0, 289.0, 29.0, 11.0, 8.0, 4.0, 11.0, 6.0, 5.0, 3.0, 4.0, 4.0, 6.0, 5.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2353515625, -0.22782516479492188, -0.22029876708984375, -0.21277236938476562, -0.2052459716796875, -0.19771957397460938, -0.19019317626953125, -0.18266677856445312, -0.175140380859375, -0.16761398315429688, -0.16008758544921875, -0.15256118774414062, -0.1450347900390625, -0.13750839233398438, -0.12998199462890625, -0.12245559692382812, -0.11492919921875, -0.10740280151367188, -0.09987640380859375, -0.09235000610351562, -0.0848236083984375, -0.07729721069335938, -0.06977081298828125, -0.062244415283203125, -0.054718017578125, -0.047191619873046875, -0.03966522216796875, -0.032138824462890625, -0.0246124267578125, -0.017086029052734375, -0.00955963134765625, -0.002033233642578125, 0.0054931640625, 0.013019561767578125, 0.02054595947265625, 0.028072357177734375, 0.0355987548828125, 0.043125152587890625, 0.05065155029296875, 0.058177947998046875, 0.065704345703125, 0.07323074340820312, 0.08075714111328125, 0.08828353881835938, 0.0958099365234375, 0.10333633422851562, 0.11086273193359375, 0.11838912963867188, 0.12591552734375, 0.13344192504882812, 0.14096832275390625, 0.14849472045898438, 0.1560211181640625, 0.16354751586914062, 0.17107391357421875, 0.17860031127929688, 0.186126708984375, 0.19365310668945312, 0.20117950439453125, 0.20870590209960938, 0.2162322998046875, 0.22375869750976562, 0.23128509521484375, 0.23881149291992188, 0.246337890625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 5.0, 5.0, 9.0, 10.0, 17.0, 11.0, 20.0, 28.0, 40.0, 63.0, 78.0, 136.0, 267.0, 655.0, 4381.0, 4136599.0, 49251.0, 1713.0, 429.0, 203.0, 108.0, 67.0, 46.0, 32.0, 25.0, 20.0, 14.0, 13.0, 8.0, 10.0, 3.0, 7.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.52734375, -5.36376953125, -5.2001953125, -5.03662109375, -4.873046875, -4.70947265625, -4.5458984375, -4.38232421875, -4.21875, -4.05517578125, -3.8916015625, -3.72802734375, -3.564453125, -3.40087890625, -3.2373046875, -3.07373046875, -2.91015625, -2.74658203125, -2.5830078125, -2.41943359375, -2.255859375, -2.09228515625, -1.9287109375, -1.76513671875, -1.6015625, -1.43798828125, -1.2744140625, -1.11083984375, -0.947265625, -0.78369140625, -0.6201171875, -0.45654296875, -0.29296875, -0.12939453125, 0.0341796875, 0.19775390625, 0.361328125, 0.52490234375, 0.6884765625, 0.85205078125, 1.015625, 1.17919921875, 1.3427734375, 1.50634765625, 1.669921875, 1.83349609375, 1.9970703125, 2.16064453125, 2.32421875, 2.48779296875, 2.6513671875, 2.81494140625, 2.978515625, 3.14208984375, 3.3056640625, 3.46923828125, 3.6328125, 3.79638671875, 3.9599609375, 4.12353515625, 4.287109375, 4.45068359375, 4.6142578125, 4.77783203125, 4.94140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 5.0, 7.0, 9.0, 19.0, 23.0, 23.0, 37.0, 51.0, 56.0, 97.0, 398.0, 2957.0, 106.0, 59.0, 51.0, 40.0, 21.0, 18.0, 18.0, 15.0, 7.0, 12.0, 5.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.84814453125, -0.8239898681640625, -0.799835205078125, -0.7756805419921875, -0.75152587890625, -0.7273712158203125, -0.703216552734375, -0.6790618896484375, -0.6549072265625, -0.6307525634765625, -0.606597900390625, -0.5824432373046875, -0.55828857421875, -0.5341339111328125, -0.509979248046875, -0.4858245849609375, -0.461669921875, -0.4375152587890625, -0.413360595703125, -0.3892059326171875, -0.36505126953125, -0.3408966064453125, -0.316741943359375, -0.2925872802734375, -0.2684326171875, -0.2442779541015625, -0.220123291015625, -0.1959686279296875, -0.17181396484375, -0.1476593017578125, -0.123504638671875, -0.0993499755859375, -0.0751953125, -0.0510406494140625, -0.026885986328125, -0.0027313232421875, 0.02142333984375, 0.0455780029296875, 0.069732666015625, 0.0938873291015625, 0.1180419921875, 0.1421966552734375, 0.166351318359375, 0.1905059814453125, 0.21466064453125, 0.2388153076171875, 0.262969970703125, 0.2871246337890625, 0.311279296875, 0.3354339599609375, 0.359588623046875, 0.3837432861328125, 0.40789794921875, 0.4320526123046875, 0.456207275390625, 0.4803619384765625, 0.5045166015625, 0.5286712646484375, 0.552825927734375, 0.5769805908203125, 0.60113525390625, 0.6252899169921875, 0.649444580078125, 0.6735992431640625, 0.69775390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 12.0, 44.0, 694.0, 231.0, 22.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.662229537963867, -3.5942065715789795, -3.5261833667755127, -3.458160400390625, -3.390137195587158, -3.3221142292022705, -3.2540910243988037, -3.186068058013916, -3.118044853210449, -3.0500218868255615, -2.9819986820220947, -2.913975715637207, -2.8459525108337402, -2.7779295444488525, -2.7099063396453857, -2.641883373260498, -2.5738601684570312, -2.5058372020721436, -2.4378139972686768, -2.369791030883789, -2.3017678260803223, -2.2337448596954346, -2.1657216548919678, -2.09769868850708, -2.0296757221221924, -1.9616526365280151, -1.893629550933838, -1.8256064653396606, -1.7575833797454834, -1.6895602941513062, -1.621537208557129, -1.5535142421722412, -1.485491156578064, -1.4174680709838867, -1.3494449853897095, -1.2814218997955322, -1.213398814201355, -1.1453757286071777, -1.07735276222229, -1.0093295574188232, -0.9413065314292908, -0.8732834458351135, -0.8052603602409363, -0.7372373342514038, -0.6692142486572266, -0.6011911630630493, -0.5331680774688721, -0.4651449918746948, -0.3971219062805176, -0.32909882068634033, -0.2610757350921631, -0.19305267930030823, -0.12502959370613098, -0.057006508111953735, 0.011016547679901123, 0.07903963327407837, 0.14706271886825562, 0.21508580446243286, 0.2831088900566101, 0.35113194584846497, 0.4191550314426422, 0.48717811703681946, 0.5552011728286743, 0.6232242584228516, 0.6912473440170288]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 1.0, 4.0, 4.0, 6.0, 6.0, 21.0, 23.0, 36.0, 40.0, 62.0, 96.0, 108.0, 120.0, 108.0, 98.0, 69.0, 64.0, 50.0, 23.0, 19.0, 13.0, 7.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0955047607421875, -3.9763007164001465, -3.8570964336395264, -3.7378923892974854, -3.6186883449554443, -3.499484062194824, -3.380280017852783, -3.261075973510742, -3.141871929168701, -3.02266788482666, -2.90346360206604, -2.784259557723999, -2.665055513381958, -2.545851230621338, -2.426647186279297, -2.307443141937256, -2.188239097595215, -2.069035053253174, -1.9498308897018433, -1.8306267261505127, -1.7114226818084717, -1.5922185182571411, -1.4730143547058105, -1.3538103103637695, -1.2346060276031494, -1.1154018640518188, -0.9961978197097778, -0.8769936561584473, -0.7577896118164062, -0.6385854482650757, -0.5193813443183899, -0.4001772403717041, -0.2809731960296631, -0.1617690920829773, -0.04256497323513031, 0.07663914561271667, 0.19584324955940247, 0.31504738330841064, 0.43425148725509644, 0.5534555912017822, 0.672659695148468, 0.7918637990951538, 0.9110679030418396, 1.0302720069885254, 1.149476170539856, 1.2686803340911865, 1.3878843784332275, 1.5070884227752686, 1.6262925863265991, 1.7454967498779297, 1.8647007942199707, 1.9839049577713013, 2.103109121322632, 2.222313165664673, 2.341517210006714, 2.460721492767334, 2.579925537109375, 2.699129581451416, 2.818333864212036, 2.937537908554077, 3.056741952896118, 3.1759462356567383, 3.2951502799987793, 3.4143543243408203, 3.5335583686828613]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 11.0, 11.0, 10.0, 19.0, 27.0, 23.0, 42.0, 50.0, 51.0, 68.0, 86.0, 128.0, 154.0, 201.0, 260.0, 418.0, 511.0, 701.0, 988.0, 1410.0, 2189.0, 3198.0, 4883.0, 8453.0, 16665.0, 82523.0, 865068.0, 29328.0, 11733.0, 6510.0, 3814.0, 2547.0, 1688.0, 1187.0, 869.0, 665.0, 463.0, 356.0, 301.0, 203.0, 155.0, 135.0, 109.0, 85.0, 59.0, 55.0, 32.0, 32.0, 28.0, 13.0, 20.0, 6.0, 7.0, 8.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.638671875, -0.6188812255859375, -0.599090576171875, -0.5792999267578125, -0.55950927734375, -0.5397186279296875, -0.519927978515625, -0.5001373291015625, -0.4803466796875, -0.4605560302734375, -0.440765380859375, -0.4209747314453125, -0.40118408203125, -0.3813934326171875, -0.361602783203125, -0.3418121337890625, -0.322021484375, -0.3022308349609375, -0.282440185546875, -0.2626495361328125, -0.24285888671875, -0.2230682373046875, -0.203277587890625, -0.1834869384765625, -0.1636962890625, -0.1439056396484375, -0.124114990234375, -0.1043243408203125, -0.08453369140625, -0.0647430419921875, -0.044952392578125, -0.0251617431640625, -0.00537109375, 0.0144195556640625, 0.034210205078125, 0.0540008544921875, 0.07379150390625, 0.0935821533203125, 0.113372802734375, 0.1331634521484375, 0.1529541015625, 0.1727447509765625, 0.192535400390625, 0.2123260498046875, 0.23211669921875, 0.2519073486328125, 0.271697998046875, 0.2914886474609375, 0.311279296875, 0.3310699462890625, 0.350860595703125, 0.3706512451171875, 0.39044189453125, 0.4102325439453125, 0.430023193359375, 0.4498138427734375, 0.4696044921875, 0.4893951416015625, 0.509185791015625, 0.5289764404296875, 0.54876708984375, 0.5685577392578125, 0.588348388671875, 0.6081390380859375, 0.6279296875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 9.0, 4.0, 7.0, 5.0, 9.0, 8.0, 7.0, 6.0, 19.0, 69.0, 403.0, 308.0, 36.0, 17.0, 8.0, 8.0, 5.0, 5.0, 7.0, 7.0, 1.0, 5.0, 3.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.2139892578125, -0.2073650360107422, -0.20074081420898438, -0.19411659240722656, -0.18749237060546875, -0.18086814880371094, -0.17424392700195312, -0.1676197052001953, -0.1609954833984375, -0.1543712615966797, -0.14774703979492188, -0.14112281799316406, -0.13449859619140625, -0.12787437438964844, -0.12125015258789062, -0.11462593078613281, -0.108001708984375, -0.10137748718261719, -0.09475326538085938, -0.08812904357910156, -0.08150482177734375, -0.07488059997558594, -0.06825637817382812, -0.06163215637207031, -0.0550079345703125, -0.04838371276855469, -0.041759490966796875, -0.03513526916503906, -0.02851104736328125, -0.021886825561523438, -0.015262603759765625, -0.008638381958007812, -0.00201416015625, 0.0046100616455078125, 0.011234283447265625, 0.017858505249023438, 0.02448272705078125, 0.031106948852539062, 0.037731170654296875, 0.04435539245605469, 0.0509796142578125, 0.05760383605957031, 0.06422805786132812, 0.07085227966308594, 0.07747650146484375, 0.08410072326660156, 0.09072494506835938, 0.09734916687011719, 0.103973388671875, 0.11059761047363281, 0.11722183227539062, 0.12384605407714844, 0.13047027587890625, 0.13709449768066406, 0.14371871948242188, 0.1503429412841797, 0.1569671630859375, 0.1635913848876953, 0.17021560668945312, 0.17683982849121094, 0.18346405029296875, 0.19008827209472656, 0.19671249389648438, 0.2033367156982422, 0.2099609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 17.0, 19.0, 18.0, 14.0, 20.0, 39.0, 54.0, 68.0, 67.0, 107.0, 107.0, 130.0, 217.0, 271.0, 716.0, 7407.0, 1001180.0, 35489.0, 1258.0, 371.0, 215.0, 159.0, 119.0, 103.0, 69.0, 60.0, 62.0, 42.0, 34.0, 24.0, 15.0, 17.0, 21.0, 8.0, 9.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.6015625, -2.52862548828125, -2.4556884765625, -2.38275146484375, -2.309814453125, -2.23687744140625, -2.1639404296875, -2.09100341796875, -2.01806640625, -1.94512939453125, -1.8721923828125, -1.79925537109375, -1.726318359375, -1.65338134765625, -1.5804443359375, -1.50750732421875, -1.4345703125, -1.36163330078125, -1.2886962890625, -1.21575927734375, -1.142822265625, -1.06988525390625, -0.9969482421875, -0.92401123046875, -0.85107421875, -0.77813720703125, -0.7052001953125, -0.63226318359375, -0.559326171875, -0.48638916015625, -0.4134521484375, -0.34051513671875, -0.267578125, -0.19464111328125, -0.1217041015625, -0.04876708984375, 0.024169921875, 0.09710693359375, 0.1700439453125, 0.24298095703125, 0.31591796875, 0.38885498046875, 0.4617919921875, 0.53472900390625, 0.607666015625, 0.68060302734375, 0.7535400390625, 0.82647705078125, 0.8994140625, 0.97235107421875, 1.0452880859375, 1.11822509765625, 1.191162109375, 1.26409912109375, 1.3370361328125, 1.40997314453125, 1.48291015625, 1.55584716796875, 1.6287841796875, 1.70172119140625, 1.774658203125, 1.84759521484375, 1.9205322265625, 1.99346923828125, 2.06640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 10.0, 14.0, 14.0, 7.0, 11.0, 20.0, 20.0, 24.0, 27.0, 48.0, 34.0, 35.0, 44.0, 36.0, 51.0, 59.0, 43.0, 46.0, 44.0, 51.0, 54.0, 43.0, 34.0, 32.0, 26.0, 22.0, 20.0, 21.0, 20.0, 16.0, 12.0, 13.0, 16.0, 4.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.81494140625, -0.7920913696289062, -0.7692413330078125, -0.7463912963867188, -0.723541259765625, -0.7006912231445312, -0.6778411865234375, -0.6549911499023438, -0.63214111328125, -0.6092910766601562, -0.5864410400390625, -0.5635910034179688, -0.540740966796875, -0.5178909301757812, -0.4950408935546875, -0.47219085693359375, -0.4493408203125, -0.42649078369140625, -0.4036407470703125, -0.38079071044921875, -0.357940673828125, -0.33509063720703125, -0.3122406005859375, -0.28939056396484375, -0.26654052734375, -0.24369049072265625, -0.2208404541015625, -0.19799041748046875, -0.175140380859375, -0.15229034423828125, -0.1294403076171875, -0.10659027099609375, -0.083740234375, -0.06089019775390625, -0.0380401611328125, -0.01519012451171875, 0.007659912109375, 0.03050994873046875, 0.0533599853515625, 0.07621002197265625, 0.09906005859375, 0.12191009521484375, 0.1447601318359375, 0.16761016845703125, 0.190460205078125, 0.21331024169921875, 0.2361602783203125, 0.25901031494140625, 0.2818603515625, 0.30471038818359375, 0.3275604248046875, 0.35041046142578125, 0.373260498046875, 0.39611053466796875, 0.4189605712890625, 0.44181060791015625, 0.46466064453125, 0.48751068115234375, 0.5103607177734375, 0.5332107543945312, 0.556060791015625, 0.5789108276367188, 0.6017608642578125, 0.6246109008789062, 0.6474609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 12.0, 9.0, 15.0, 22.0, 37.0, 52.0, 109.0, 197.0, 400.0, 949.0, 2928.0, 25413.0, 988891.0, 24886.0, 2935.0, 849.0, 408.0, 188.0, 114.0, 52.0, 35.0, 24.0, 14.0, 15.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001796722412109375, -0.0017358064651489258, -0.0016748905181884766, -0.0016139745712280273, -0.0015530586242675781, -0.001492142677307129, -0.0014312267303466797, -0.0013703107833862305, -0.0013093948364257812, -0.001248478889465332, -0.0011875629425048828, -0.0011266469955444336, -0.0010657310485839844, -0.0010048151016235352, -0.0009438991546630859, -0.0008829832077026367, -0.0008220672607421875, -0.0007611513137817383, -0.0007002353668212891, -0.0006393194198608398, -0.0005784034729003906, -0.0005174875259399414, -0.0004565715789794922, -0.00039565563201904297, -0.00033473968505859375, -0.00027382373809814453, -0.0002129077911376953, -0.0001519918441772461, -9.107589721679688e-05, -3.0159950256347656e-05, 3.075599670410156e-05, 9.167194366455078e-05, 0.000152587890625, 0.00021350383758544922, 0.00027441978454589844, 0.00033533573150634766, 0.0003962516784667969, 0.0004571676254272461, 0.0005180835723876953, 0.0005789995193481445, 0.0006399154663085938, 0.000700831413269043, 0.0007617473602294922, 0.0008226633071899414, 0.0008835792541503906, 0.0009444952011108398, 0.001005411148071289, 0.0010663270950317383, 0.0011272430419921875, 0.0011881589889526367, 0.001249074935913086, 0.0013099908828735352, 0.0013709068298339844, 0.0014318227767944336, 0.0014927387237548828, 0.001553654670715332, 0.0016145706176757812, 0.0016754865646362305, 0.0017364025115966797, 0.001797318458557129, 0.0018582344055175781, 0.0019191503524780273, 0.0019800662994384766, 0.0020409822463989258, 0.002101898193359375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 17.0, 16.0, 24.0, 14.0, 45.0, 56.0, 69.0, 74.0, 59.0, 90.0, 103.0, 72.0, 82.0, 73.0, 26.0, 46.0, 27.0, 25.0, 24.0, 11.0, 8.0, 5.0, 5.0, 1.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.079673767089844e-06, -5.911104381084442e-06, -5.7425349950790405e-06, -5.573965609073639e-06, -5.405396223068237e-06, -5.236826837062836e-06, -5.068257451057434e-06, -4.8996880650520325e-06, -4.731118679046631e-06, -4.562549293041229e-06, -4.393979907035828e-06, -4.225410521030426e-06, -4.056841135025024e-06, -3.888271749019623e-06, -3.719702363014221e-06, -3.5511329770088196e-06, -3.382563591003418e-06, -3.2139942049980164e-06, -3.0454248189926147e-06, -2.876855432987213e-06, -2.7082860469818115e-06, -2.53971666097641e-06, -2.3711472749710083e-06, -2.2025778889656067e-06, -2.034008502960205e-06, -1.8654391169548035e-06, -1.6968697309494019e-06, -1.5283003449440002e-06, -1.3597309589385986e-06, -1.191161572933197e-06, -1.0225921869277954e-06, -8.540228009223938e-07, -6.854534149169922e-07, -5.168840289115906e-07, -3.4831464290618896e-07, -1.7974525690078735e-07, -1.1175870895385742e-08, 1.5739351511001587e-07, 3.259629011154175e-07, 4.945322871208191e-07, 6.631016731262207e-07, 8.316710591316223e-07, 1.000240445137024e-06, 1.1688098311424255e-06, 1.3373792171478271e-06, 1.5059486031532288e-06, 1.6745179891586304e-06, 1.843087375164032e-06, 2.0116567611694336e-06, 2.180226147174835e-06, 2.348795533180237e-06, 2.5173649191856384e-06, 2.68593430519104e-06, 2.8545036911964417e-06, 3.0230730772018433e-06, 3.191642463207245e-06, 3.3602118492126465e-06, 3.528781235218048e-06, 3.6973506212234497e-06, 3.865920007228851e-06, 4.034489393234253e-06, 4.2030587792396545e-06, 4.371628165245056e-06, 4.540197551250458e-06, 4.708766937255859e-06]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 6.0, 5.0, 7.0, 12.0, 11.0, 33.0, 31.0, 54.0, 65.0, 104.0, 156.0, 237.0, 500.0, 3724.0, 1026199.0, 15731.0, 823.0, 278.0, 175.0, 116.0, 75.0, 47.0, 30.0, 29.0, 22.0, 12.0, 17.0, 7.0, 8.0, 12.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024929046630859375, -0.002411574125289917, -0.0023302435874938965, -0.002248913049697876, -0.0021675825119018555, -0.002086251974105835, -0.0020049214363098145, -0.001923590898513794, -0.0018422603607177734, -0.001760929822921753, -0.0016795992851257324, -0.001598268747329712, -0.0015169382095336914, -0.001435607671737671, -0.0013542771339416504, -0.0012729465961456299, -0.0011916160583496094, -0.0011102855205535889, -0.0010289549827575684, -0.0009476244449615479, -0.0008662939071655273, -0.0007849633693695068, -0.0007036328315734863, -0.0006223022937774658, -0.0005409717559814453, -0.0004596412181854248, -0.0003783106803894043, -0.0002969801425933838, -0.00021564960479736328, -0.00013431906700134277, -5.2988529205322266e-05, 2.8342008590698242e-05, 0.00010967254638671875, 0.00019100308418273926, 0.00027233362197875977, 0.0003536641597747803, 0.0004349946975708008, 0.0005163252353668213, 0.0005976557731628418, 0.0006789863109588623, 0.0007603168487548828, 0.0008416473865509033, 0.0009229779243469238, 0.0010043084621429443, 0.0010856389999389648, 0.0011669695377349854, 0.0012483000755310059, 0.0013296306133270264, 0.0014109611511230469, 0.0014922916889190674, 0.0015736222267150879, 0.0016549527645111084, 0.001736283302307129, 0.0018176138401031494, 0.00189894437789917, 0.0019802749156951904, 0.002061605453491211, 0.0021429359912872314, 0.002224266529083252, 0.0023055970668792725, 0.002386927604675293, 0.0024682581424713135, 0.002549588680267334, 0.0026309192180633545, 0.002712249755859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 4.0, 4.0, 15.0, 20.0, 32.0, 30.0, 45.0, 39.0, 62.0, 86.0, 77.0, 93.0, 99.0, 78.0, 72.0, 56.0, 38.0, 31.0, 25.0, 16.0, 14.0, 12.0, 6.0, 8.0, 5.0, 7.0, 8.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007805824279785156, -0.0007551088929176331, -0.0007296353578567505, -0.0007041618227958679, -0.0006786882877349854, -0.0006532147526741028, -0.0006277412176132202, -0.0006022676825523376, -0.0005767941474914551, -0.0005513206124305725, -0.0005258470773696899, -0.0005003735423088074, -0.0004749000072479248, -0.00044942647218704224, -0.00042395293712615967, -0.0003984794020652771, -0.00037300586700439453, -0.00034753233194351196, -0.0003220587968826294, -0.0002965852618217468, -0.00027111172676086426, -0.0002456381916999817, -0.00022016465663909912, -0.00019469112157821655, -0.00016921758651733398, -0.00014374405145645142, -0.00011827051639556885, -9.279698133468628e-05, -6.732344627380371e-05, -4.184991121292114e-05, -1.6376376152038574e-05, 9.097158908843994e-06, 3.457069396972656e-05, 6.004422903060913e-05, 8.55177640914917e-05, 0.00011099129915237427, 0.00013646483421325684, 0.0001619383692741394, 0.00018741190433502197, 0.00021288543939590454, 0.0002383589744567871, 0.0002638325095176697, 0.00028930604457855225, 0.0003147795796394348, 0.0003402531147003174, 0.00036572664976119995, 0.0003912001848220825, 0.0004166737198829651, 0.00044214725494384766, 0.0004676207900047302, 0.0004930943250656128, 0.0005185678601264954, 0.0005440413951873779, 0.0005695149302482605, 0.0005949884653091431, 0.0006204620003700256, 0.0006459355354309082, 0.0006714090704917908, 0.0006968826055526733, 0.0007223561406135559, 0.0007478296756744385, 0.000773303210735321, 0.0007987767457962036, 0.0008242502808570862, 0.0008497238159179688]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 28.0, 934.0, 54.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.134574890136719, -4.726897239685059, -4.319219589233398, -3.91154146194458, -3.50386381149292, -3.0961861610412598, -2.6885082721710205, -2.2808303833007812, -1.873152732849121, -1.4654749631881714, -1.0577971935272217, -0.650119423866272, -0.24244165420532227, 0.1652359962463379, 0.5729138851165771, 0.9805917739868164, 1.3882694244384766, 1.7959471940994263, 2.203624963760376, 2.6113028526306152, 3.0189805030822754, 3.4266581535339355, 3.834336042404175, 4.242013931274414, 4.649691581726074, 5.057369232177734, 5.4650468826293945, 5.872725009918213, 6.280402660369873, 6.688080310821533, 7.095758438110352, 7.503436088562012, 7.911113739013672, 8.318791389465332, 8.726469039916992, 9.134146690368652, 9.541824340820312, 9.949502944946289, 10.35718059539795, 10.76485824584961, 11.17253589630127, 11.58021354675293, 11.98789119720459, 12.39556884765625, 12.803247451782227, 13.21092414855957, 13.618602752685547, 14.026280403137207, 14.433958053588867, 14.841635704040527, 15.249313354492188, 15.656991004943848, 16.064668655395508, 16.472347259521484, 16.880023956298828, 17.287702560424805, 17.69538116455078, 18.103059768676758, 18.5107364654541, 18.918415069580078, 19.326091766357422, 19.7337703704834, 20.141447067260742, 20.54912567138672, 20.956802368164062]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 11.0, 12.0, 12.0, 15.0, 20.0, 21.0, 34.0, 29.0, 45.0, 32.0, 52.0, 54.0, 51.0, 53.0, 67.0, 52.0, 76.0, 62.0, 55.0, 48.0, 39.0, 32.0, 29.0, 30.0, 10.0, 15.0, 10.0, 8.0, 6.0, 5.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.527304649353027, -5.335773944854736, -5.144243240356445, -4.952712535858154, -4.761181831359863, -4.569651126861572, -4.378120422363281, -4.186590194702148, -3.9950592517852783, -3.8035285472869873, -3.6119978427886963, -3.4204673767089844, -3.2289366722106934, -3.0374059677124023, -2.8458752632141113, -2.6543445587158203, -2.4628138542175293, -2.2712831497192383, -2.0797524452209473, -1.8882218599319458, -1.6966911554336548, -1.5051604509353638, -1.3136298656463623, -1.1220991611480713, -0.9305684566497803, -0.7390377521514893, -0.547507107257843, -0.3559764623641968, -0.16444575786590576, 0.027084946632385254, 0.21861553192138672, 0.41014623641967773, 0.601677417755127, 0.793208122253418, 0.9847387671470642, 1.1762694120407104, 1.3678001165390015, 1.5593308210372925, 1.750861406326294, 1.942392110824585, 2.133922815322876, 2.325453519821167, 2.516984224319458, 2.70851469039917, 2.900045394897461, 3.091576099395752, 3.283106803894043, 3.474637508392334, 3.666168212890625, 3.857698917388916, 4.049229621887207, 4.240760326385498, 4.432291030883789, 4.62382173538208, 4.815352439880371, 5.006882667541504, 5.198413848876953, 5.389944553375244, 5.581475257873535, 5.773005962371826, 5.964536666870117, 6.156067371368408, 6.347598075866699, 6.539128303527832, 6.730659008026123]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 8.0, 10.0, 9.0, 9.0, 14.0, 26.0, 52.0, 91.0, 190.0, 607.0, 2451.0, 4173154.0, 14705.0, 1771.0, 610.0, 241.0, 119.0, 89.0, 22.0, 22.0, 10.0, 12.0, 8.0, 8.0, 4.0, 9.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.39453125, -3.287811279296875, -3.18109130859375, -3.074371337890625, -2.9676513671875, -2.860931396484375, -2.75421142578125, -2.647491455078125, -2.540771484375, -2.434051513671875, -2.32733154296875, -2.220611572265625, -2.1138916015625, -2.007171630859375, -1.90045166015625, -1.793731689453125, -1.68701171875, -1.580291748046875, -1.47357177734375, -1.366851806640625, -1.2601318359375, -1.153411865234375, -1.04669189453125, -0.939971923828125, -0.833251953125, -0.726531982421875, -0.61981201171875, -0.513092041015625, -0.4063720703125, -0.299652099609375, -0.19293212890625, -0.086212158203125, 0.0205078125, 0.127227783203125, 0.23394775390625, 0.340667724609375, 0.4473876953125, 0.554107666015625, 0.66082763671875, 0.767547607421875, 0.874267578125, 0.980987548828125, 1.08770751953125, 1.194427490234375, 1.3011474609375, 1.407867431640625, 1.51458740234375, 1.621307373046875, 1.72802734375, 1.834747314453125, 1.94146728515625, 2.048187255859375, 2.1549072265625, 2.261627197265625, 2.36834716796875, 2.475067138671875, 2.581787109375, 2.688507080078125, 2.79522705078125, 2.901947021484375, 3.0086669921875, 3.115386962890625, 3.22210693359375, 3.328826904296875, 3.435546875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 10.0, 4.0, 5.0, 9.0, 8.0, 7.0, 7.0, 13.0, 36.0, 202.0, 431.0, 143.0, 23.0, 10.0, 6.0, 6.0, 7.0, 5.0, 7.0, 4.0, 3.0, 6.0, 4.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.203125, -0.19673728942871094, -0.19034957885742188, -0.1839618682861328, -0.17757415771484375, -0.1711864471435547, -0.16479873657226562, -0.15841102600097656, -0.1520233154296875, -0.14563560485839844, -0.13924789428710938, -0.1328601837158203, -0.12647247314453125, -0.12008476257324219, -0.11369705200195312, -0.10730934143066406, -0.100921630859375, -0.09453392028808594, -0.08814620971679688, -0.08175849914550781, -0.07537078857421875, -0.06898307800292969, -0.06259536743164062, -0.05620765686035156, -0.0498199462890625, -0.04343223571777344, -0.037044525146484375, -0.030656814575195312, -0.02426910400390625, -0.017881393432617188, -0.011493682861328125, -0.0051059722900390625, 0.00128173828125, 0.0076694488525390625, 0.014057159423828125, 0.020444869995117188, 0.02683258056640625, 0.03322029113769531, 0.039608001708984375, 0.04599571228027344, 0.0523834228515625, 0.05877113342285156, 0.06515884399414062, 0.07154655456542969, 0.07793426513671875, 0.08432197570800781, 0.09070968627929688, 0.09709739685058594, 0.103485107421875, 0.10987281799316406, 0.11626052856445312, 0.12264823913574219, 0.12903594970703125, 0.1354236602783203, 0.14181137084960938, 0.14819908142089844, 0.1545867919921875, 0.16097450256347656, 0.16736221313476562, 0.1737499237060547, 0.18013763427734375, 0.1865253448486328, 0.19291305541992188, 0.19930076599121094, 0.2056884765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 8.0, 3.0, 6.0, 7.0, 10.0, 9.0, 10.0, 12.0, 32.0, 30.0, 30.0, 38.0, 50.0, 88.0, 151.0, 290.0, 789.0, 7467.0, 4165409.0, 17832.0, 1121.0, 335.0, 174.0, 95.0, 58.0, 43.0, 32.0, 30.0, 28.0, 16.0, 10.0, 11.0, 9.0, 13.0, 4.0, 5.0, 9.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.740234375, -2.65618896484375, -2.5721435546875, -2.48809814453125, -2.404052734375, -2.32000732421875, -2.2359619140625, -2.15191650390625, -2.06787109375, -1.98382568359375, -1.8997802734375, -1.81573486328125, -1.731689453125, -1.64764404296875, -1.5635986328125, -1.47955322265625, -1.3955078125, -1.31146240234375, -1.2274169921875, -1.14337158203125, -1.059326171875, -0.97528076171875, -0.8912353515625, -0.80718994140625, -0.72314453125, -0.63909912109375, -0.5550537109375, -0.47100830078125, -0.386962890625, -0.30291748046875, -0.2188720703125, -0.13482666015625, -0.05078125, 0.03326416015625, 0.1173095703125, 0.20135498046875, 0.285400390625, 0.36944580078125, 0.4534912109375, 0.53753662109375, 0.62158203125, 0.70562744140625, 0.7896728515625, 0.87371826171875, 0.957763671875, 1.04180908203125, 1.1258544921875, 1.20989990234375, 1.2939453125, 1.37799072265625, 1.4620361328125, 1.54608154296875, 1.630126953125, 1.71417236328125, 1.7982177734375, 1.88226318359375, 1.96630859375, 2.05035400390625, 2.1343994140625, 2.21844482421875, 2.302490234375, 2.38653564453125, 2.4705810546875, 2.55462646484375, 2.638671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 5.0, 8.0, 8.0, 10.0, 4.0, 18.0, 15.0, 21.0, 26.0, 39.0, 113.0, 3408.0, 163.0, 51.0, 27.0, 18.0, 20.0, 17.0, 18.0, 10.0, 6.0, 7.0, 7.0, 4.0, 5.0, 4.0, 8.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.43505859375, -0.4217109680175781, -0.40836334228515625, -0.3950157165527344, -0.3816680908203125, -0.3683204650878906, -0.35497283935546875, -0.3416252136230469, -0.328277587890625, -0.3149299621582031, -0.30158233642578125, -0.2882347106933594, -0.2748870849609375, -0.2615394592285156, -0.24819183349609375, -0.23484420776367188, -0.22149658203125, -0.20814895629882812, -0.19480133056640625, -0.18145370483398438, -0.1681060791015625, -0.15475845336914062, -0.14141082763671875, -0.12806320190429688, -0.114715576171875, -0.10136795043945312, -0.08802032470703125, -0.07467269897460938, -0.0613250732421875, -0.047977447509765625, -0.03462982177734375, -0.021282196044921875, -0.0079345703125, 0.005413055419921875, 0.01876068115234375, 0.032108306884765625, 0.0454559326171875, 0.058803558349609375, 0.07215118408203125, 0.08549880981445312, 0.098846435546875, 0.11219406127929688, 0.12554168701171875, 0.13888931274414062, 0.1522369384765625, 0.16558456420898438, 0.17893218994140625, 0.19227981567382812, 0.20562744140625, 0.21897506713867188, 0.23232269287109375, 0.24567031860351562, 0.2590179443359375, 0.2723655700683594, 0.28571319580078125, 0.2990608215332031, 0.312408447265625, 0.3257560729980469, 0.33910369873046875, 0.3524513244628906, 0.3657989501953125, 0.3791465759277344, 0.39249420166015625, 0.4058418273925781, 0.419189453125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1008.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.11021900177002, -9.928184509277344, -9.746150970458984, -9.564116477966309, -9.38208293914795, -9.200048446655273, -9.018014907836914, -8.835980415344238, -8.653945922851562, -8.471911430358887, -8.289877891540527, -8.107843399047852, -7.925809860229492, -7.743775367736816, -7.561741352081299, -7.379707336425781, -7.197673797607422, -7.015639781951904, -6.833605766296387, -6.651571750640869, -6.469537734985352, -6.287503242492676, -6.105469226837158, -5.923435211181641, -5.741401195526123, -5.5593671798706055, -5.377333164215088, -5.19529914855957, -5.0132646560668945, -4.831230640411377, -4.649196624755859, -4.467162609100342, -4.285128116607666, -4.103094100952148, -3.921060085296631, -3.739025831222534, -3.5569918155670166, -3.374957799911499, -3.1929235458374023, -3.0108895301818848, -2.828855514526367, -2.6468214988708496, -2.464787483215332, -2.2827532291412354, -2.1007192134857178, -1.9186851978302002, -1.736651062965393, -1.554616928100586, -1.3725829124450684, -1.1905488967895508, -1.0085147619247437, -0.8264806866645813, -0.644446611404419, -0.4624125361442566, -0.28037846088409424, -0.09834432601928711, 0.08368968963623047, 0.2657237648963928, 0.4477578401565552, 0.6297919154167175, 0.8118259906768799, 0.9938600659370422, 1.1758941411972046, 1.3579282760620117, 1.5399622917175293]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 3.0, 11.0, 9.0, 11.0, 15.0, 26.0, 23.0, 22.0, 58.0, 46.0, 56.0, 84.0, 82.0, 90.0, 72.0, 60.0, 62.0, 57.0, 58.0, 36.0, 20.0, 23.0, 15.0, 12.0, 12.0, 10.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.842200756072998, -1.7918740510940552, -1.7415473461151123, -1.691220760345459, -1.6408940553665161, -1.5905673503875732, -1.54024076461792, -1.489914059638977, -1.4395873546600342, -1.3892606496810913, -1.3389339447021484, -1.2886073589324951, -1.2382806539535522, -1.1879539489746094, -1.137627363204956, -1.0873006582260132, -1.0369739532470703, -0.9866472482681274, -0.9363206028938293, -0.8859939575195312, -0.8356672525405884, -0.7853405475616455, -0.7350139021873474, -0.6846872568130493, -0.6343605518341064, -0.5840338468551636, -0.5337072014808655, -0.483380526304245, -0.4330538511276245, -0.38272717595100403, -0.33240050077438354, -0.28207382559776306, -0.23174715042114258, -0.1814204752445221, -0.1310938000679016, -0.08076712489128113, -0.030440449714660645, 0.01988622546195984, 0.07021290063858032, 0.1205395758152008, 0.1708662509918213, 0.22119292616844177, 0.27151960134506226, 0.32184627652168274, 0.3721729516983032, 0.4224996268749237, 0.4728263020515442, 0.5231529474258423, 0.5734796524047852, 0.623806357383728, 0.6741330027580261, 0.7244596481323242, 0.7747863531112671, 0.82511305809021, 0.8754397034645081, 0.9257663488388062, 0.976093053817749, 1.026419758796692, 1.0767464637756348, 1.127073049545288, 1.177399754524231, 1.2277264595031738, 1.2780530452728271, 1.32837975025177, 1.378706455230713]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 8.0, 9.0, 12.0, 15.0, 11.0, 13.0, 25.0, 55.0, 57.0, 89.0, 110.0, 175.0, 223.0, 345.0, 472.0, 727.0, 1022.0, 1781.0, 2836.0, 4424.0, 8353.0, 17511.0, 95486.0, 859232.0, 27887.0, 11604.0, 5898.0, 3532.0, 2329.0, 1353.0, 907.0, 593.0, 416.0, 325.0, 213.0, 138.0, 100.0, 82.0, 52.0, 37.0, 37.0, 15.0, 16.0, 7.0, 11.0, 7.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5712890625, -0.5535659790039062, -0.5358428955078125, -0.5181198120117188, -0.500396728515625, -0.48267364501953125, -0.4649505615234375, -0.44722747802734375, -0.42950439453125, -0.41178131103515625, -0.3940582275390625, -0.37633514404296875, -0.358612060546875, -0.34088897705078125, -0.3231658935546875, -0.30544281005859375, -0.2877197265625, -0.26999664306640625, -0.2522735595703125, -0.23455047607421875, -0.216827392578125, -0.19910430908203125, -0.1813812255859375, -0.16365814208984375, -0.14593505859375, -0.12821197509765625, -0.1104888916015625, -0.09276580810546875, -0.075042724609375, -0.05731964111328125, -0.0395965576171875, -0.02187347412109375, -0.004150390625, 0.01357269287109375, 0.0312957763671875, 0.04901885986328125, 0.066741943359375, 0.08446502685546875, 0.1021881103515625, 0.11991119384765625, 0.13763427734375, 0.15535736083984375, 0.1730804443359375, 0.19080352783203125, 0.208526611328125, 0.22624969482421875, 0.2439727783203125, 0.26169586181640625, 0.2794189453125, 0.29714202880859375, 0.3148651123046875, 0.33258819580078125, 0.350311279296875, 0.36803436279296875, 0.3857574462890625, 0.40348052978515625, 0.42120361328125, 0.43892669677734375, 0.4566497802734375, 0.47437286376953125, 0.492095947265625, 0.5098190307617188, 0.5275421142578125, 0.5452651977539062, 0.56298828125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 5.0, 8.0, 7.0, 5.0, 7.0, 6.0, 8.0, 8.0, 17.0, 37.0, 217.0, 415.0, 138.0, 24.0, 9.0, 9.0, 5.0, 7.0, 7.0, 6.0, 4.0, 2.0, 7.0, 5.0, 7.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.1986083984375, -0.1923542022705078, -0.18610000610351562, -0.17984580993652344, -0.17359161376953125, -0.16733741760253906, -0.16108322143554688, -0.1548290252685547, -0.1485748291015625, -0.1423206329345703, -0.13606643676757812, -0.12981224060058594, -0.12355804443359375, -0.11730384826660156, -0.11104965209960938, -0.10479545593261719, -0.098541259765625, -0.09228706359863281, -0.08603286743164062, -0.07977867126464844, -0.07352447509765625, -0.06727027893066406, -0.061016082763671875, -0.05476188659667969, -0.0485076904296875, -0.04225349426269531, -0.035999298095703125, -0.029745101928710938, -0.02349090576171875, -0.017236709594726562, -0.010982513427734375, -0.0047283172607421875, 0.00152587890625, 0.0077800750732421875, 0.014034271240234375, 0.020288467407226562, 0.02654266357421875, 0.03279685974121094, 0.039051055908203125, 0.04530525207519531, 0.0515594482421875, 0.05781364440917969, 0.06406784057617188, 0.07032203674316406, 0.07657623291015625, 0.08283042907714844, 0.08908462524414062, 0.09533882141113281, 0.101593017578125, 0.10784721374511719, 0.11410140991210938, 0.12035560607910156, 0.12660980224609375, 0.13286399841308594, 0.13911819458007812, 0.1453723907470703, 0.1516265869140625, 0.1578807830810547, 0.16413497924804688, 0.17038917541503906, 0.17664337158203125, 0.18289756774902344, 0.18915176391601562, 0.1954059600830078, 0.20166015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 13.0, 9.0, 12.0, 13.0, 22.0, 28.0, 28.0, 46.0, 57.0, 42.0, 82.0, 61.0, 75.0, 104.0, 122.0, 111.0, 189.0, 286.0, 494.0, 1143.0, 11719.0, 938550.0, 90484.0, 2688.0, 688.0, 307.0, 189.0, 176.0, 118.0, 131.0, 96.0, 68.0, 67.0, 65.0, 46.0, 44.0, 35.0, 26.0, 24.0, 14.0, 9.0, 11.0, 9.0, 14.0, 9.0, 3.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.4296875, -1.3846282958984375, -1.339569091796875, -1.2945098876953125, -1.24945068359375, -1.2043914794921875, -1.159332275390625, -1.1142730712890625, -1.0692138671875, -1.0241546630859375, -0.979095458984375, -0.9340362548828125, -0.88897705078125, -0.8439178466796875, -0.798858642578125, -0.7537994384765625, -0.708740234375, -0.6636810302734375, -0.618621826171875, -0.5735626220703125, -0.52850341796875, -0.4834442138671875, -0.438385009765625, -0.3933258056640625, -0.3482666015625, -0.3032073974609375, -0.258148193359375, -0.2130889892578125, -0.16802978515625, -0.1229705810546875, -0.077911376953125, -0.0328521728515625, 0.01220703125, 0.0572662353515625, 0.102325439453125, 0.1473846435546875, 0.19244384765625, 0.2375030517578125, 0.282562255859375, 0.3276214599609375, 0.3726806640625, 0.4177398681640625, 0.462799072265625, 0.5078582763671875, 0.55291748046875, 0.5979766845703125, 0.643035888671875, 0.6880950927734375, 0.733154296875, 0.7782135009765625, 0.823272705078125, 0.8683319091796875, 0.91339111328125, 0.9584503173828125, 1.003509521484375, 1.0485687255859375, 1.0936279296875, 1.1386871337890625, 1.183746337890625, 1.2288055419921875, 1.27386474609375, 1.3189239501953125, 1.363983154296875, 1.4090423583984375, 1.4541015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 6.0, 11.0, 8.0, 10.0, 25.0, 15.0, 13.0, 27.0, 14.0, 25.0, 25.0, 34.0, 28.0, 39.0, 46.0, 45.0, 42.0, 46.0, 39.0, 34.0, 43.0, 35.0, 41.0, 39.0, 35.0, 28.0, 26.0, 40.0, 31.0, 22.0, 18.0, 23.0, 14.0, 10.0, 14.0, 11.0, 6.0, 4.0, 4.0, 1.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58740234375, -0.5678482055664062, -0.5482940673828125, -0.5287399291992188, -0.509185791015625, -0.48963165283203125, -0.4700775146484375, -0.45052337646484375, -0.43096923828125, -0.41141510009765625, -0.3918609619140625, -0.37230682373046875, -0.352752685546875, -0.33319854736328125, -0.3136444091796875, -0.29409027099609375, -0.2745361328125, -0.25498199462890625, -0.2354278564453125, -0.21587371826171875, -0.196319580078125, -0.17676544189453125, -0.1572113037109375, -0.13765716552734375, -0.11810302734375, -0.09854888916015625, -0.0789947509765625, -0.05944061279296875, -0.039886474609375, -0.02033233642578125, -0.0007781982421875, 0.01877593994140625, 0.038330078125, 0.05788421630859375, 0.0774383544921875, 0.09699249267578125, 0.116546630859375, 0.13610076904296875, 0.1556549072265625, 0.17520904541015625, 0.19476318359375, 0.21431732177734375, 0.2338714599609375, 0.25342559814453125, 0.272979736328125, 0.29253387451171875, 0.3120880126953125, 0.33164215087890625, 0.3511962890625, 0.37075042724609375, 0.3903045654296875, 0.40985870361328125, 0.429412841796875, 0.44896697998046875, 0.4685211181640625, 0.48807525634765625, 0.50762939453125, 0.5271835327148438, 0.5467376708984375, 0.5662918090820312, 0.585845947265625, 0.6054000854492188, 0.6249542236328125, 0.6445083618164062, 0.6640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 8.0, 5.0, 7.0, 12.0, 14.0, 17.0, 25.0, 24.0, 30.0, 69.0, 68.0, 113.0, 190.0, 242.0, 471.0, 745.0, 1547.0, 3672.0, 12338.0, 104206.0, 877944.0, 34502.0, 6988.0, 2491.0, 1170.0, 593.0, 352.0, 237.0, 141.0, 98.0, 48.0, 52.0, 33.0, 28.0, 12.0, 13.0, 18.0, 7.0, 2.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007958412170410156, -0.0007686689496040344, -0.0007414966821670532, -0.000714324414730072, -0.0006871521472930908, -0.0006599798798561096, -0.0006328076124191284, -0.0006056353449821472, -0.000578463077545166, -0.0005512908101081848, -0.0005241185426712036, -0.0004969462752342224, -0.0004697740077972412, -0.00044260174036026, -0.0004154294729232788, -0.0003882572054862976, -0.0003610849380493164, -0.0003339126706123352, -0.000306740403175354, -0.0002795681357383728, -0.0002523958683013916, -0.0002252236008644104, -0.0001980513334274292, -0.000170879065990448, -0.0001437067985534668, -0.0001165345311164856, -8.93622636795044e-05, -6.21899962425232e-05, -3.501772880554199e-05, -7.845461368560791e-06, 1.932680606842041e-05, 4.649907350540161e-05, 7.367134094238281e-05, 0.00010084360837936401, 0.00012801587581634521, 0.00015518814325332642, 0.00018236041069030762, 0.00020953267812728882, 0.00023670494556427002, 0.0002638772130012512, 0.0002910494804382324, 0.0003182217478752136, 0.0003453940153121948, 0.000372566282749176, 0.0003997385501861572, 0.00042691081762313843, 0.00045408308506011963, 0.00048125535249710083, 0.000508427619934082, 0.0005355998873710632, 0.0005627721548080444, 0.0005899444222450256, 0.0006171166896820068, 0.000644288957118988, 0.0006714612245559692, 0.0006986334919929504, 0.0007258057594299316, 0.0007529780268669128, 0.000780150294303894, 0.0008073225617408752, 0.0008344948291778564, 0.0008616670966148376, 0.0008888393640518188, 0.0009160116314888, 0.0009431838989257812]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 6.0, 1.0, 3.0, 8.0, 5.0, 9.0, 12.0, 9.0, 23.0, 13.0, 27.0, 14.0, 49.0, 47.0, 28.0, 63.0, 31.0, 71.0, 34.0, 62.0, 54.0, 38.0, 47.0, 29.0, 65.0, 22.0, 35.0, 55.0, 18.0, 36.0, 13.0, 17.0, 16.0, 2.0, 10.0, 4.0, 4.0, 3.0, 7.0, 8.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9802322387695312e-06, -2.886168658733368e-06, -2.7921050786972046e-06, -2.6980414986610413e-06, -2.603977918624878e-06, -2.5099143385887146e-06, -2.4158507585525513e-06, -2.321787178516388e-06, -2.2277235984802246e-06, -2.1336600184440613e-06, -2.039596438407898e-06, -1.9455328583717346e-06, -1.8514692783355713e-06, -1.757405698299408e-06, -1.6633421182632446e-06, -1.5692785382270813e-06, -1.475214958190918e-06, -1.3811513781547546e-06, -1.2870877981185913e-06, -1.193024218082428e-06, -1.0989606380462646e-06, -1.0048970580101013e-06, -9.10833477973938e-07, -8.167698979377747e-07, -7.227063179016113e-07, -6.28642737865448e-07, -5.345791578292847e-07, -4.4051557779312134e-07, -3.46451997756958e-07, -2.523884177207947e-07, -1.5832483768463135e-07, -6.426125764846802e-08, 2.9802322387695312e-08, 1.2386590242385864e-07, 2.1792948246002197e-07, 3.119930624961853e-07, 4.0605664253234863e-07, 5.00120222568512e-07, 5.941838026046753e-07, 6.882473826408386e-07, 7.82310962677002e-07, 8.763745427131653e-07, 9.704381227493286e-07, 1.064501702785492e-06, 1.1585652828216553e-06, 1.2526288628578186e-06, 1.346692442893982e-06, 1.4407560229301453e-06, 1.5348196029663086e-06, 1.628883183002472e-06, 1.7229467630386353e-06, 1.8170103430747986e-06, 1.911073923110962e-06, 2.0051375031471252e-06, 2.0992010831832886e-06, 2.193264663219452e-06, 2.2873282432556152e-06, 2.3813918232917786e-06, 2.475455403327942e-06, 2.5695189833641052e-06, 2.6635825634002686e-06, 2.757646143436432e-06, 2.8517097234725952e-06, 2.9457733035087585e-06, 3.039836883544922e-06]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 7.0, 10.0, 20.0, 26.0, 66.0, 117.0, 240.0, 629.0, 9164.0, 1035788.0, 1711.0, 382.0, 166.0, 89.0, 50.0, 30.0, 12.0, 10.0, 6.0, 4.0, 0.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003620147705078125, -0.0035080015659332275, -0.00339585542678833, -0.0032837092876434326, -0.003171563148498535, -0.0030594170093536377, -0.0029472708702087402, -0.0028351247310638428, -0.0027229785919189453, -0.002610832452774048, -0.0024986863136291504, -0.002386540174484253, -0.0022743940353393555, -0.002162247896194458, -0.0020501017570495605, -0.001937955617904663, -0.0018258094787597656, -0.0017136633396148682, -0.0016015172004699707, -0.0014893710613250732, -0.0013772249221801758, -0.0012650787830352783, -0.0011529326438903809, -0.0010407865047454834, -0.0009286403656005859, -0.0008164942264556885, -0.000704348087310791, -0.0005922019481658936, -0.0004800558090209961, -0.00036790966987609863, -0.00025576353073120117, -0.0001436173915863037, -3.147125244140625e-05, 8.067488670349121e-05, 0.00019282102584838867, 0.00030496716499328613, 0.0004171133041381836, 0.0005292594432830811, 0.0006414055824279785, 0.000753551721572876, 0.0008656978607177734, 0.000977843999862671, 0.0010899901390075684, 0.0012021362781524658, 0.0013142824172973633, 0.0014264285564422607, 0.0015385746955871582, 0.0016507208347320557, 0.0017628669738769531, 0.0018750131130218506, 0.001987159252166748, 0.0020993053913116455, 0.002211451530456543, 0.0023235976696014404, 0.002435743808746338, 0.0025478899478912354, 0.002660036087036133, 0.0027721822261810303, 0.0028843283653259277, 0.002996474504470825, 0.0031086206436157227, 0.00322076678276062, 0.0033329129219055176, 0.003445059061050415, 0.0035572052001953125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 10.0, 21.0, 28.0, 63.0, 90.0, 123.0, 192.0, 164.0, 118.0, 73.0, 41.0, 29.0, 15.0, 9.0, 10.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0016527175903320312, -0.0016090571880340576, -0.001565396785736084, -0.0015217363834381104, -0.0014780759811401367, -0.001434415578842163, -0.0013907551765441895, -0.0013470947742462158, -0.0013034343719482422, -0.0012597739696502686, -0.001216113567352295, -0.0011724531650543213, -0.0011287927627563477, -0.001085132360458374, -0.0010414719581604004, -0.0009978115558624268, -0.0009541511535644531, -0.0009104907512664795, -0.0008668303489685059, -0.0008231699466705322, -0.0007795095443725586, -0.000735849142074585, -0.0006921887397766113, -0.0006485283374786377, -0.0006048679351806641, -0.0005612075328826904, -0.0005175471305847168, -0.00047388672828674316, -0.00043022632598876953, -0.0003865659236907959, -0.00034290552139282227, -0.00029924511909484863, -0.000255584716796875, -0.00021192431449890137, -0.00016826391220092773, -0.0001246035099029541, -8.094310760498047e-05, -3.7282705307006836e-05, 6.377696990966797e-06, 5.003809928894043e-05, 9.369850158691406e-05, 0.0001373589038848877, 0.00018101930618286133, 0.00022467970848083496, 0.0002683401107788086, 0.0003120005130767822, 0.00035566091537475586, 0.0003993213176727295, 0.0004429817199707031, 0.00048664212226867676, 0.0005303025245666504, 0.000573962926864624, 0.0006176233291625977, 0.0006612837314605713, 0.0007049441337585449, 0.0007486045360565186, 0.0007922649383544922, 0.0008359253406524658, 0.0008795857429504395, 0.0009232461452484131, 0.0009669065475463867, 0.0010105669498443604, 0.001054227352142334, 0.0010978877544403076, 0.0011415481567382812]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 17.0, 277.0, 677.0, 36.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7332582473754883, -1.5620062351226807, -1.390754222869873, -1.2195022106170654, -1.0482501983642578, -0.8769981265068054, -0.705746054649353, -0.5344940423965454, -0.3632420301437378, -0.19199000298976898, -0.02073797583580017, 0.15051406621932983, 0.32176607847213745, 0.49301809072494507, 0.6642701625823975, 0.8355221748352051, 1.0067741870880127, 1.1780261993408203, 1.349278211593628, 1.5205302238464355, 1.6917822360992432, 1.8630342483520508, 2.0342864990234375, 2.205538272857666, 2.3767905235290527, 2.5480425357818604, 2.719294548034668, 2.8905465602874756, 3.061798572540283, 3.233050584793091, 3.4043025970458984, 3.575554847717285, 3.7468066215515137, 3.9180586338043213, 4.089310646057129, 4.260562896728516, 4.431814670562744, 4.603066921234131, 4.774318695068359, 4.945570945739746, 5.116822719573975, 5.288074970245361, 5.45932674407959, 5.630578994750977, 5.801830768585205, 5.973083019256592, 6.14433479309082, 6.315587043762207, 6.486839294433594, 6.6580915451049805, 6.829343318939209, 7.000595569610596, 7.171847343444824, 7.343099594116211, 7.5143513679504395, 7.685603618621826, 7.856855392456055, 8.028107643127441, 8.199359893798828, 8.370611190795898, 8.541863441467285, 8.713115692138672, 8.884367942810059, 9.055619239807129, 9.226871490478516]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 3.0, 11.0, 9.0, 16.0, 22.0, 6.0, 31.0, 37.0, 34.0, 49.0, 52.0, 51.0, 48.0, 61.0, 64.0, 64.0, 72.0, 63.0, 48.0, 38.0, 45.0, 37.0, 35.0, 24.0, 19.0, 20.0, 18.0, 5.0, 8.0, 8.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.99738883972168, -4.811003684997559, -4.6246185302734375, -4.438233375549316, -4.251848220825195, -4.065463066101074, -3.879077911376953, -3.692692756652832, -3.506307601928711, -3.31992244720459, -3.1335372924804688, -2.9471521377563477, -2.7607669830322266, -2.5743818283081055, -2.3879966735839844, -2.2016115188598633, -2.015226364135742, -1.828841209411621, -1.6424560546875, -1.456070899963379, -1.2696857452392578, -1.0833005905151367, -0.8969154357910156, -0.7105302810668945, -0.5241451263427734, -0.33775997161865234, -0.15137481689453125, 0.035010337829589844, 0.22139549255371094, 0.40778064727783203, 0.5941658020019531, 0.7805509567260742, 0.9669361114501953, 1.1533212661743164, 1.3397064208984375, 1.5260915756225586, 1.7124767303466797, 1.8988618850708008, 2.085247039794922, 2.271632194519043, 2.458017349243164, 2.644402503967285, 2.8307876586914062, 3.0171728134155273, 3.2035579681396484, 3.3899431228637695, 3.5763282775878906, 3.7627134323120117, 3.949098587036133, 4.135483741760254, 4.321868896484375, 4.508254051208496, 4.694639205932617, 4.881024360656738, 5.067409515380859, 5.2537946701049805, 5.440179824829102, 5.626564979553223, 5.812950134277344, 5.999335289001465, 6.185720443725586, 6.372105598449707, 6.558490753173828, 6.744875907897949, 6.93126106262207]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 9.0, 6.0, 6.0, 8.0, 11.0, 20.0, 19.0, 37.0, 46.0, 60.0, 92.0, 106.0, 164.0, 268.0, 471.0, 1075.0, 16298.0, 4164957.0, 7739.0, 1041.0, 543.0, 323.0, 229.0, 185.0, 121.0, 99.0, 70.0, 60.0, 41.0, 35.0, 22.0, 19.0, 14.0, 7.0, 13.0, 10.0, 11.0, 10.0, 4.0, 7.0, 4.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.83642578125, -0.809844970703125, -0.78326416015625, -0.756683349609375, -0.7301025390625, -0.703521728515625, -0.67694091796875, -0.650360107421875, -0.623779296875, -0.597198486328125, -0.57061767578125, -0.544036865234375, -0.5174560546875, -0.490875244140625, -0.46429443359375, -0.437713623046875, -0.4111328125, -0.384552001953125, -0.35797119140625, -0.331390380859375, -0.3048095703125, -0.278228759765625, -0.25164794921875, -0.225067138671875, -0.198486328125, -0.171905517578125, -0.14532470703125, -0.118743896484375, -0.0921630859375, -0.065582275390625, -0.03900146484375, -0.012420654296875, 0.01416015625, 0.040740966796875, 0.06732177734375, 0.093902587890625, 0.1204833984375, 0.147064208984375, 0.17364501953125, 0.200225830078125, 0.226806640625, 0.253387451171875, 0.27996826171875, 0.306549072265625, 0.3331298828125, 0.359710693359375, 0.38629150390625, 0.412872314453125, 0.439453125, 0.466033935546875, 0.49261474609375, 0.519195556640625, 0.5457763671875, 0.572357177734375, 0.59893798828125, 0.625518798828125, 0.652099609375, 0.678680419921875, 0.70526123046875, 0.731842041015625, 0.7584228515625, 0.785003662109375, 0.81158447265625, 0.838165283203125, 0.86474609375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 6.0, 6.0, 8.0, 4.0, 9.0, 5.0, 9.0, 10.0, 19.0, 99.0, 297.0, 326.0, 83.0, 26.0, 6.0, 5.0, 6.0, 10.0, 7.0, 4.0, 2.0, 6.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.1954345703125, -0.18922042846679688, -0.18300628662109375, -0.17679214477539062, -0.1705780029296875, -0.16436386108398438, -0.15814971923828125, -0.15193557739257812, -0.145721435546875, -0.13950729370117188, -0.13329315185546875, -0.12707901000976562, -0.1208648681640625, -0.11465072631835938, -0.10843658447265625, -0.10222244262695312, -0.09600830078125, -0.08979415893554688, -0.08358001708984375, -0.07736587524414062, -0.0711517333984375, -0.06493759155273438, -0.05872344970703125, -0.052509307861328125, -0.046295166015625, -0.040081024169921875, -0.03386688232421875, -0.027652740478515625, -0.0214385986328125, -0.015224456787109375, -0.00901031494140625, -0.002796173095703125, 0.00341796875, 0.009632110595703125, 0.01584625244140625, 0.022060394287109375, 0.0282745361328125, 0.034488677978515625, 0.04070281982421875, 0.046916961669921875, 0.053131103515625, 0.059345245361328125, 0.06555938720703125, 0.07177352905273438, 0.0779876708984375, 0.08420181274414062, 0.09041595458984375, 0.09663009643554688, 0.10284423828125, 0.10905838012695312, 0.11527252197265625, 0.12148666381835938, 0.1277008056640625, 0.13391494750976562, 0.14012908935546875, 0.14634323120117188, 0.152557373046875, 0.15877151489257812, 0.16498565673828125, 0.17119979858398438, 0.1774139404296875, 0.18362808227539062, 0.18984222412109375, 0.19605636596679688, 0.2022705078125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 5.0, 7.0, 4.0, 4.0, 8.0, 11.0, 4.0, 6.0, 13.0, 16.0, 24.0, 37.0, 53.0, 84.0, 193.0, 436.0, 3351.0, 4153977.0, 34196.0, 1215.0, 276.0, 131.0, 61.0, 41.0, 18.0, 22.0, 15.0, 15.0, 14.0, 12.0, 8.0, 8.0, 3.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.357421875, -1.3160247802734375, -1.274627685546875, -1.2332305908203125, -1.19183349609375, -1.1504364013671875, -1.109039306640625, -1.0676422119140625, -1.0262451171875, -0.9848480224609375, -0.943450927734375, -0.9020538330078125, -0.86065673828125, -0.8192596435546875, -0.777862548828125, -0.7364654541015625, -0.695068359375, -0.6536712646484375, -0.612274169921875, -0.5708770751953125, -0.52947998046875, -0.4880828857421875, -0.446685791015625, -0.4052886962890625, -0.3638916015625, -0.3224945068359375, -0.281097412109375, -0.2397003173828125, -0.19830322265625, -0.1569061279296875, -0.115509033203125, -0.0741119384765625, -0.03271484375, 0.0086822509765625, 0.050079345703125, 0.0914764404296875, 0.13287353515625, 0.1742706298828125, 0.215667724609375, 0.2570648193359375, 0.2984619140625, 0.3398590087890625, 0.381256103515625, 0.4226531982421875, 0.46405029296875, 0.5054473876953125, 0.546844482421875, 0.5882415771484375, 0.629638671875, 0.6710357666015625, 0.712432861328125, 0.7538299560546875, 0.79522705078125, 0.8366241455078125, 0.878021240234375, 0.9194183349609375, 0.9608154296875, 1.0022125244140625, 1.043609619140625, 1.0850067138671875, 1.12640380859375, 1.1678009033203125, 1.209197998046875, 1.2505950927734375, 1.2919921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 12.0, 10.0, 19.0, 34.0, 54.0, 225.0, 3441.0, 123.0, 37.0, 21.0, 16.0, 12.0, 13.0, 4.0, 9.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2325439453125, -0.2246112823486328, -0.21667861938476562, -0.20874595642089844, -0.20081329345703125, -0.19288063049316406, -0.18494796752929688, -0.1770153045654297, -0.1690826416015625, -0.1611499786376953, -0.15321731567382812, -0.14528465270996094, -0.13735198974609375, -0.12941932678222656, -0.12148666381835938, -0.11355400085449219, -0.105621337890625, -0.09768867492675781, -0.08975601196289062, -0.08182334899902344, -0.07389068603515625, -0.06595802307128906, -0.058025360107421875, -0.05009269714355469, -0.0421600341796875, -0.03422737121582031, -0.026294708251953125, -0.018362045288085938, -0.01042938232421875, -0.0024967193603515625, 0.005435943603515625, 0.013368606567382812, 0.02130126953125, 0.029233932495117188, 0.037166595458984375, 0.04509925842285156, 0.05303192138671875, 0.06096458435058594, 0.06889724731445312, 0.07682991027832031, 0.0847625732421875, 0.09269523620605469, 0.10062789916992188, 0.10856056213378906, 0.11649322509765625, 0.12442588806152344, 0.13235855102539062, 0.1402912139892578, 0.148223876953125, 0.1561565399169922, 0.16408920288085938, 0.17202186584472656, 0.17995452880859375, 0.18788719177246094, 0.19581985473632812, 0.2037525177001953, 0.2116851806640625, 0.2196178436279297, 0.22755050659179688, 0.23548316955566406, 0.24341583251953125, 0.25134849548339844, 0.2592811584472656, 0.2672138214111328, 0.275146484375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1011.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.31766414642334, -6.203608989715576, -6.089553356170654, -5.975498199462891, -5.861443042755127, -5.747387886047363, -5.633332252502441, -5.519277095794678, -5.405221939086914, -5.29116678237915, -5.1771111488342285, -5.063055992126465, -4.949000835418701, -4.8349456787109375, -4.720890045166016, -4.606834888458252, -4.49277925491333, -4.378724098205566, -4.2646684646606445, -4.150613307952881, -4.036558151245117, -3.9225027561187744, -3.8084473609924316, -3.694392204284668, -3.5803370475769043, -3.4662816524505615, -3.352226495742798, -3.238171100616455, -3.1241159439086914, -3.0100605487823486, -2.896005153656006, -2.781949996948242, -2.6678946018218994, -2.5538392066955566, -2.439784049987793, -2.32572865486145, -2.2116734981536865, -2.0976181030273438, -1.9835628271102905, -1.8695075511932373, -1.7554521560668945, -1.6413968801498413, -1.527341604232788, -1.4132862091064453, -1.299230933189392, -1.1851756572723389, -1.0711203813552856, -0.9570650458335876, -0.8430097699165344, -0.7289544939994812, -0.6148991584777832, -0.50084388256073, -0.38678857684135437, -0.27273327112197876, -0.15867799520492554, -0.04462265968322754, 0.06943261623382568, 0.1834879219532013, 0.2975432276725769, 0.4115985035896301, 0.5256538391113281, 0.6397091150283813, 0.7537643909454346, 0.8678197264671326, 0.9818750023841858]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 7.0, 4.0, 7.0, 15.0, 12.0, 14.0, 20.0, 26.0, 23.0, 38.0, 39.0, 47.0, 46.0, 53.0, 41.0, 52.0, 47.0, 41.0, 55.0, 49.0, 44.0, 35.0, 42.0, 34.0, 25.0, 25.0, 26.0, 32.0, 17.0, 8.0, 14.0, 10.0, 9.0, 7.0, 8.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.5576825737953186, -0.5419741868972778, -0.5262658596038818, -0.5105574727058411, -0.4948490858078003, -0.4791407287120819, -0.4634323716163635, -0.44772398471832275, -0.43201562762260437, -0.416307270526886, -0.4005988836288452, -0.38489052653312683, -0.36918216943740845, -0.3534737825393677, -0.3377654254436493, -0.3220570683479309, -0.30634868144989014, -0.29064032435417175, -0.274931937456131, -0.2592235803604126, -0.24351520836353302, -0.22780683636665344, -0.21209847927093506, -0.19639010727405548, -0.1806817352771759, -0.16497336328029633, -0.14926499128341675, -0.13355663418769836, -0.11784826219081879, -0.10213989019393921, -0.08643152564764023, -0.07072316110134125, -0.055014729499816895, -0.039306361228227615, -0.023597992956638336, -0.007889624685049057, 0.007818743586540222, 0.0235271155834198, 0.03923548012971878, 0.05494384467601776, 0.07065221667289734, 0.08636058866977692, 0.1020689532160759, 0.11777731776237488, 0.13348568975925446, 0.14919406175613403, 0.16490241885185242, 0.180610790848732, 0.19631916284561157, 0.21202753484249115, 0.22773590683937073, 0.2434442639350891, 0.2591526508331299, 0.27486100792884827, 0.29056936502456665, 0.3062777519226074, 0.3219861090183258, 0.3376944661140442, 0.35340285301208496, 0.36911121010780334, 0.38481956720352173, 0.4005279541015625, 0.4162363111972809, 0.43194466829299927, 0.44765305519104004]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 12.0, 14.0, 21.0, 32.0, 33.0, 51.0, 81.0, 91.0, 155.0, 210.0, 261.0, 370.0, 574.0, 760.0, 1172.0, 1833.0, 2736.0, 4564.0, 8147.0, 16817.0, 104202.0, 851058.0, 28221.0, 10773.0, 5924.0, 3524.0, 2255.0, 1475.0, 975.0, 688.0, 440.0, 322.0, 217.0, 165.0, 97.0, 80.0, 55.0, 43.0, 34.0, 14.0, 9.0, 11.0, 10.0, 9.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.396484375, -0.3837890625, -0.37109375, -0.3583984375, -0.345703125, -0.3330078125, -0.3203125, -0.3076171875, -0.294921875, -0.2822265625, -0.26953125, -0.2568359375, -0.244140625, -0.2314453125, -0.21875, -0.2060546875, -0.193359375, -0.1806640625, -0.16796875, -0.1552734375, -0.142578125, -0.1298828125, -0.1171875, -0.1044921875, -0.091796875, -0.0791015625, -0.06640625, -0.0537109375, -0.041015625, -0.0283203125, -0.015625, -0.0029296875, 0.009765625, 0.0224609375, 0.03515625, 0.0478515625, 0.060546875, 0.0732421875, 0.0859375, 0.0986328125, 0.111328125, 0.1240234375, 0.13671875, 0.1494140625, 0.162109375, 0.1748046875, 0.1875, 0.2001953125, 0.212890625, 0.2255859375, 0.23828125, 0.2509765625, 0.263671875, 0.2763671875, 0.2890625, 0.3017578125, 0.314453125, 0.3271484375, 0.33984375, 0.3525390625, 0.365234375, 0.3779296875, 0.390625, 0.4033203125, 0.416015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 5.0, 7.0, 4.0, 7.0, 7.0, 7.0, 5.0, 9.0, 12.0, 23.0, 120.0, 344.0, 281.0, 57.0, 23.0, 6.0, 6.0, 6.0, 9.0, 6.0, 4.0, 4.0, 5.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.19287109375, -0.18669891357421875, -0.1805267333984375, -0.17435455322265625, -0.168182373046875, -0.16201019287109375, -0.1558380126953125, -0.14966583251953125, -0.14349365234375, -0.13732147216796875, -0.1311492919921875, -0.12497711181640625, -0.118804931640625, -0.11263275146484375, -0.1064605712890625, -0.10028839111328125, -0.0941162109375, -0.08794403076171875, -0.0817718505859375, -0.07559967041015625, -0.069427490234375, -0.06325531005859375, -0.0570831298828125, -0.05091094970703125, -0.04473876953125, -0.03856658935546875, -0.0323944091796875, -0.02622222900390625, -0.020050048828125, -0.01387786865234375, -0.0077056884765625, -0.00153350830078125, 0.004638671875, 0.01081085205078125, 0.0169830322265625, 0.02315521240234375, 0.029327392578125, 0.03549957275390625, 0.0416717529296875, 0.04784393310546875, 0.05401611328125, 0.06018829345703125, 0.0663604736328125, 0.07253265380859375, 0.078704833984375, 0.08487701416015625, 0.0910491943359375, 0.09722137451171875, 0.1033935546875, 0.10956573486328125, 0.1157379150390625, 0.12191009521484375, 0.128082275390625, 0.13425445556640625, 0.1404266357421875, 0.14659881591796875, 0.15277099609375, 0.15894317626953125, 0.1651153564453125, 0.17128753662109375, 0.177459716796875, 0.18363189697265625, 0.1898040771484375, 0.19597625732421875, 0.2021484375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 7.0, 9.0, 6.0, 20.0, 24.0, 36.0, 36.0, 43.0, 68.0, 79.0, 80.0, 134.0, 114.0, 173.0, 219.0, 305.0, 646.0, 1733.0, 23179.0, 996014.0, 21872.0, 1743.0, 615.0, 331.0, 208.0, 157.0, 154.0, 102.0, 99.0, 85.0, 53.0, 56.0, 37.0, 24.0, 23.0, 15.0, 15.0, 8.0, 8.0, 2.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.193359375, -1.1566314697265625, -1.119903564453125, -1.0831756591796875, -1.04644775390625, -1.0097198486328125, -0.972991943359375, -0.9362640380859375, -0.8995361328125, -0.8628082275390625, -0.826080322265625, -0.7893524169921875, -0.75262451171875, -0.7158966064453125, -0.679168701171875, -0.6424407958984375, -0.605712890625, -0.5689849853515625, -0.532257080078125, -0.4955291748046875, -0.45880126953125, -0.4220733642578125, -0.385345458984375, -0.3486175537109375, -0.3118896484375, -0.2751617431640625, -0.238433837890625, -0.2017059326171875, -0.16497802734375, -0.1282501220703125, -0.091522216796875, -0.0547943115234375, -0.01806640625, 0.0186614990234375, 0.055389404296875, 0.0921173095703125, 0.12884521484375, 0.1655731201171875, 0.202301025390625, 0.2390289306640625, 0.2757568359375, 0.3124847412109375, 0.349212646484375, 0.3859405517578125, 0.42266845703125, 0.4593963623046875, 0.496124267578125, 0.5328521728515625, 0.569580078125, 0.6063079833984375, 0.643035888671875, 0.6797637939453125, 0.71649169921875, 0.7532196044921875, 0.789947509765625, 0.8266754150390625, 0.8634033203125, 0.9001312255859375, 0.936859130859375, 0.9735870361328125, 1.01031494140625, 1.0470428466796875, 1.083770751953125, 1.1204986572265625, 1.1572265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 3.0, 10.0, 12.0, 15.0, 19.0, 13.0, 22.0, 28.0, 22.0, 42.0, 21.0, 28.0, 33.0, 45.0, 51.0, 38.0, 47.0, 51.0, 45.0, 50.0, 53.0, 36.0, 34.0, 51.0, 33.0, 26.0, 30.0, 34.0, 21.0, 19.0, 15.0, 10.0, 14.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.67822265625, -0.6573486328125, -0.636474609375, -0.6156005859375, -0.5947265625, -0.5738525390625, -0.552978515625, -0.5321044921875, -0.51123046875, -0.4903564453125, -0.469482421875, -0.4486083984375, -0.427734375, -0.4068603515625, -0.385986328125, -0.3651123046875, -0.34423828125, -0.3233642578125, -0.302490234375, -0.2816162109375, -0.2607421875, -0.2398681640625, -0.218994140625, -0.1981201171875, -0.17724609375, -0.1563720703125, -0.135498046875, -0.1146240234375, -0.09375, -0.0728759765625, -0.052001953125, -0.0311279296875, -0.01025390625, 0.0106201171875, 0.031494140625, 0.0523681640625, 0.0732421875, 0.0941162109375, 0.114990234375, 0.1358642578125, 0.15673828125, 0.1776123046875, 0.198486328125, 0.2193603515625, 0.240234375, 0.2611083984375, 0.281982421875, 0.3028564453125, 0.32373046875, 0.3446044921875, 0.365478515625, 0.3863525390625, 0.4072265625, 0.4281005859375, 0.448974609375, 0.4698486328125, 0.49072265625, 0.5115966796875, 0.532470703125, 0.5533447265625, 0.57421875, 0.5950927734375, 0.615966796875, 0.6368408203125, 0.65771484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 11.0, 8.0, 12.0, 18.0, 33.0, 57.0, 86.0, 146.0, 270.0, 621.0, 1413.0, 4366.0, 26080.0, 959211.0, 47417.0, 5608.0, 1686.0, 738.0, 322.0, 162.0, 96.0, 67.0, 40.0, 21.0, 15.0, 10.0, 5.0, 6.0, 4.0, 10.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0009069442749023438, -0.0008821636438369751, -0.0008573830127716064, -0.0008326023817062378, -0.0008078217506408691, -0.0007830411195755005, -0.0007582604885101318, -0.0007334798574447632, -0.0007086992263793945, -0.0006839185953140259, -0.0006591379642486572, -0.0006343573331832886, -0.0006095767021179199, -0.0005847960710525513, -0.0005600154399871826, -0.000535234808921814, -0.0005104541778564453, -0.00048567354679107666, -0.000460892915725708, -0.00043611228466033936, -0.0004113316535949707, -0.00038655102252960205, -0.0003617703914642334, -0.00033698976039886475, -0.0003122091293334961, -0.00028742849826812744, -0.0002626478672027588, -0.00023786723613739014, -0.00021308660507202148, -0.00018830597400665283, -0.00016352534294128418, -0.00013874471187591553, -0.00011396408081054688, -8.918344974517822e-05, -6.440281867980957e-05, -3.962218761444092e-05, -1.4841556549072266e-05, 9.939074516296387e-06, 3.471970558166504e-05, 5.950033664703369e-05, 8.428096771240234e-05, 0.000109061598777771, 0.00013384222984313965, 0.0001586228609085083, 0.00018340349197387695, 0.0002081841230392456, 0.00023296475410461426, 0.0002577453851699829, 0.00028252601623535156, 0.0003073066473007202, 0.00033208727836608887, 0.0003568679094314575, 0.00038164854049682617, 0.0004064291715621948, 0.0004312098026275635, 0.00045599043369293213, 0.0004807710647583008, 0.0005055516958236694, 0.0005303323268890381, 0.0005551129579544067, 0.0005798935890197754, 0.000604674220085144, 0.0006294548511505127, 0.0006542354822158813, 0.00067901611328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 6.0, 11.0, 6.0, 18.0, 14.0, 22.0, 21.0, 44.0, 29.0, 32.0, 43.0, 63.0, 57.0, 45.0, 70.0, 73.0, 47.0, 65.0, 39.0, 85.0, 31.0, 38.0, 35.0, 24.0, 29.0, 16.0, 7.0, 8.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7550926208496094e-06, -3.6209821701049805e-06, -3.4868717193603516e-06, -3.3527612686157227e-06, -3.2186508178710938e-06, -3.084540367126465e-06, -2.950429916381836e-06, -2.816319465637207e-06, -2.682209014892578e-06, -2.5480985641479492e-06, -2.4139881134033203e-06, -2.2798776626586914e-06, -2.1457672119140625e-06, -2.0116567611694336e-06, -1.8775463104248047e-06, -1.7434358596801758e-06, -1.6093254089355469e-06, -1.475214958190918e-06, -1.341104507446289e-06, -1.2069940567016602e-06, -1.0728836059570312e-06, -9.387731552124023e-07, -8.046627044677734e-07, -6.705522537231445e-07, -5.364418029785156e-07, -4.023313522338867e-07, -2.682209014892578e-07, -1.341104507446289e-07, 0.0, 1.341104507446289e-07, 2.682209014892578e-07, 4.023313522338867e-07, 5.364418029785156e-07, 6.705522537231445e-07, 8.046627044677734e-07, 9.387731552124023e-07, 1.0728836059570312e-06, 1.2069940567016602e-06, 1.341104507446289e-06, 1.475214958190918e-06, 1.6093254089355469e-06, 1.7434358596801758e-06, 1.8775463104248047e-06, 2.0116567611694336e-06, 2.1457672119140625e-06, 2.2798776626586914e-06, 2.4139881134033203e-06, 2.5480985641479492e-06, 2.682209014892578e-06, 2.816319465637207e-06, 2.950429916381836e-06, 3.084540367126465e-06, 3.2186508178710938e-06, 3.3527612686157227e-06, 3.4868717193603516e-06, 3.6209821701049805e-06, 3.7550926208496094e-06, 3.889203071594238e-06, 4.023313522338867e-06, 4.157423973083496e-06, 4.291534423828125e-06, 4.425644874572754e-06, 4.559755325317383e-06, 4.693865776062012e-06, 4.827976226806641e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 4.0, 5.0, 4.0, 7.0, 15.0, 7.0, 19.0, 19.0, 46.0, 59.0, 139.0, 284.0, 732.0, 7373.0, 1033433.0, 5142.0, 665.0, 245.0, 125.0, 80.0, 29.0, 26.0, 15.0, 10.0, 6.0, 8.0, 9.0, 7.0, 6.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0018491744995117188, -0.001793891191482544, -0.0017386078834533691, -0.0016833245754241943, -0.0016280412673950195, -0.0015727579593658447, -0.00151747465133667, -0.0014621913433074951, -0.0014069080352783203, -0.0013516247272491455, -0.0012963414192199707, -0.001241058111190796, -0.001185774803161621, -0.0011304914951324463, -0.0010752081871032715, -0.0010199248790740967, -0.0009646415710449219, -0.0009093582630157471, -0.0008540749549865723, -0.0007987916469573975, -0.0007435083389282227, -0.0006882250308990479, -0.000632941722869873, -0.0005776584148406982, -0.0005223751068115234, -0.00046709179878234863, -0.00041180849075317383, -0.000356525182723999, -0.0003012418746948242, -0.0002459585666656494, -0.0001906752586364746, -0.0001353919506072998, -8.0108642578125e-05, -2.4825334548950195e-05, 3.045797348022461e-05, 8.574128150939941e-05, 0.00014102458953857422, 0.00019630789756774902, 0.00025159120559692383, 0.00030687451362609863, 0.00036215782165527344, 0.00041744112968444824, 0.00047272443771362305, 0.0005280077457427979, 0.0005832910537719727, 0.0006385743618011475, 0.0006938576698303223, 0.0007491409778594971, 0.0008044242858886719, 0.0008597075939178467, 0.0009149909019470215, 0.0009702742099761963, 0.001025557518005371, 0.001080840826034546, 0.0011361241340637207, 0.0011914074420928955, 0.0012466907501220703, 0.0013019740581512451, 0.00135725736618042, 0.0014125406742095947, 0.0014678239822387695, 0.0015231072902679443, 0.0015783905982971191, 0.001633673906326294, 0.0016889572143554688]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 6.0, 20.0, 29.0, 54.0, 84.0, 125.0, 191.0, 175.0, 111.0, 77.0, 33.0, 28.0, 13.0, 12.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0010519027709960938, -0.0010208189487457275, -0.0009897351264953613, -0.0009586513042449951, -0.0009275674819946289, -0.0008964836597442627, -0.0008653998374938965, -0.0008343160152435303, -0.0008032321929931641, -0.0007721483707427979, -0.0007410645484924316, -0.0007099807262420654, -0.0006788969039916992, -0.000647813081741333, -0.0006167292594909668, -0.0005856454372406006, -0.0005545616149902344, -0.0005234777927398682, -0.000492393970489502, -0.00046131014823913574, -0.00043022632598876953, -0.0003991425037384033, -0.0003680586814880371, -0.0003369748592376709, -0.0003058910369873047, -0.0002748072147369385, -0.00024372339248657227, -0.00021263957023620605, -0.00018155574798583984, -0.00015047192573547363, -0.00011938810348510742, -8.830428123474121e-05, -5.7220458984375e-05, -2.613663673400879e-05, 4.947185516357422e-06, 3.603100776672363e-05, 6.711483001708984e-05, 9.819865226745605e-05, 0.00012928247451782227, 0.00016036629676818848, 0.0001914501190185547, 0.0002225339412689209, 0.0002536177635192871, 0.0002847015857696533, 0.00031578540802001953, 0.00034686923027038574, 0.00037795305252075195, 0.00040903687477111816, 0.0004401206970214844, 0.0004712045192718506, 0.0005022883415222168, 0.000533372163772583, 0.0005644559860229492, 0.0005955398082733154, 0.0006266236305236816, 0.0006577074527740479, 0.0006887912750244141, 0.0007198750972747803, 0.0007509589195251465, 0.0007820427417755127, 0.0008131265640258789, 0.0008442103862762451, 0.0008752942085266113, 0.0009063780307769775, 0.0009374618530273438]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [11.0, 103.0, 857.0, 43.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5036439895629883, -0.2884173095226288, -0.07319062948226929, 0.1420360803604126, 0.3572627305984497, 0.5724893808364868, 0.7877161502838135, 1.0029428005218506, 1.2181694507598877, 1.4333961009979248, 1.648622751235962, 1.8638495206832886, 2.0790762901306152, 2.2943029403686523, 2.5095295906066895, 2.7247562408447266, 2.9399828910827637, 3.155209541320801, 3.370436191558838, 3.585662841796875, 3.800889492034912, 4.016116142272949, 4.2313432693481445, 4.446569442749023, 4.661796569824219, 4.877023220062256, 5.092249870300293, 5.30747652053833, 5.522703170776367, 5.737929821014404, 5.953156471252441, 6.168383598327637, 6.383609771728516, 6.598836421966553, 6.81406307220459, 7.029289722442627, 7.244516372680664, 7.459743022918701, 7.674969673156738, 7.890196800231934, 8.105422973632812, 8.320650100708008, 8.535876274108887, 8.751103401184082, 8.966329574584961, 9.181556701660156, 9.396782875061035, 9.61201000213623, 9.82723617553711, 10.042463302612305, 10.257689476013184, 10.472916603088379, 10.688142776489258, 10.903369903564453, 11.118596076965332, 11.333823204040527, 11.549050331115723, 11.764277458190918, 11.979503631591797, 12.194730758666992, 12.409956932067871, 12.625184059143066, 12.840410232543945, 13.05563735961914, 13.27086353302002]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 4.0, 14.0, 11.0, 13.0, 13.0, 19.0, 29.0, 28.0, 33.0, 40.0, 44.0, 37.0, 56.0, 43.0, 59.0, 62.0, 57.0, 43.0, 54.0, 40.0, 39.0, 41.0, 36.0, 29.0, 27.0, 19.0, 20.0, 18.0, 19.0, 9.0, 8.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.081312656402588, -3.939197540283203, -3.7970826625823975, -3.6549675464630127, -3.512852668762207, -3.3707375526428223, -3.2286224365234375, -3.0865073204040527, -2.944392442703247, -2.8022773265838623, -2.6601624488830566, -2.518047332763672, -2.375932216644287, -2.2338173389434814, -2.0917022228240967, -1.9495872259140015, -1.8074722290039062, -1.665357232093811, -1.5232422351837158, -1.381127119064331, -1.2390121221542358, -1.0968971252441406, -0.9547820687294006, -0.8126670122146606, -0.6705520153045654, -0.5284370183944702, -0.3863219618797302, -0.24420693516731262, -0.10209190845489502, 0.040023088455200195, 0.18213814496994019, 0.3242532014846802, 0.4663677215576172, 0.6084827184677124, 0.7505977749824524, 0.8927128314971924, 1.0348278284072876, 1.1769428253173828, 1.3190579414367676, 1.4611729383468628, 1.603287935256958, 1.7454029321670532, 1.8875179290771484, 2.029633045196533, 2.171748161315918, 2.3138630390167236, 2.4559781551361084, 2.598093032836914, 2.740208148956299, 2.8823232650756836, 3.0244381427764893, 3.166553258895874, 3.3086681365966797, 3.4507832527160645, 3.592898368835449, 3.735013484954834, 3.8771283626556396, 4.019243240356445, 4.16135835647583, 4.303473472595215, 4.4455885887146, 4.587703704833984, 4.729818344116211, 4.871933460235596, 5.0140485763549805]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 8.0, 14.0, 12.0, 12.0, 22.0, 38.0, 36.0, 38.0, 73.0, 92.0, 149.0, 506.0, 27469.0, 4164749.0, 395.0, 132.0, 101.0, 80.0, 53.0, 42.0, 49.0, 38.0, 29.0, 20.0, 17.0, 12.0, 16.0, 11.0, 9.0, 5.0, 7.0, 4.0, 5.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.9990234375, -0.9669036865234375, -0.934783935546875, -0.9026641845703125, -0.87054443359375, -0.8384246826171875, -0.806304931640625, -0.7741851806640625, -0.7420654296875, -0.7099456787109375, -0.677825927734375, -0.6457061767578125, -0.61358642578125, -0.5814666748046875, -0.549346923828125, -0.5172271728515625, -0.485107421875, -0.4529876708984375, -0.420867919921875, -0.3887481689453125, -0.35662841796875, -0.3245086669921875, -0.292388916015625, -0.2602691650390625, -0.2281494140625, -0.1960296630859375, -0.163909912109375, -0.1317901611328125, -0.09967041015625, -0.0675506591796875, -0.035430908203125, -0.0033111572265625, 0.02880859375, 0.0609283447265625, 0.093048095703125, 0.1251678466796875, 0.15728759765625, 0.1894073486328125, 0.221527099609375, 0.2536468505859375, 0.2857666015625, 0.3178863525390625, 0.350006103515625, 0.3821258544921875, 0.41424560546875, 0.4463653564453125, 0.478485107421875, 0.5106048583984375, 0.542724609375, 0.5748443603515625, 0.606964111328125, 0.6390838623046875, 0.67120361328125, 0.7033233642578125, 0.735443115234375, 0.7675628662109375, 0.7996826171875, 0.8318023681640625, 0.863922119140625, 0.8960418701171875, 0.92816162109375, 0.9602813720703125, 0.992401123046875, 1.0245208740234375, 1.056640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 11.0, 3.0, 5.0, 7.0, 6.0, 7.0, 4.0, 13.0, 9.0, 39.0, 163.0, 343.0, 232.0, 52.0, 17.0, 9.0, 3.0, 7.0, 7.0, 8.0, 4.0, 4.0, 5.0, 7.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.1856689453125, -0.17969894409179688, -0.17372894287109375, -0.16775894165039062, -0.1617889404296875, -0.15581893920898438, -0.14984893798828125, -0.14387893676757812, -0.137908935546875, -0.13193893432617188, -0.12596893310546875, -0.11999893188476562, -0.1140289306640625, -0.10805892944335938, -0.10208892822265625, -0.09611892700195312, -0.09014892578125, -0.08417892456054688, -0.07820892333984375, -0.07223892211914062, -0.0662689208984375, -0.060298919677734375, -0.05432891845703125, -0.048358917236328125, -0.042388916015625, -0.036418914794921875, -0.03044891357421875, -0.024478912353515625, -0.0185089111328125, -0.012538909912109375, -0.00656890869140625, -0.000598907470703125, 0.00537109375, 0.011341094970703125, 0.01731109619140625, 0.023281097412109375, 0.0292510986328125, 0.035221099853515625, 0.04119110107421875, 0.047161102294921875, 0.053131103515625, 0.059101104736328125, 0.06507110595703125, 0.07104110717773438, 0.0770111083984375, 0.08298110961914062, 0.08895111083984375, 0.09492111206054688, 0.10089111328125, 0.10686111450195312, 0.11283111572265625, 0.11880111694335938, 0.1247711181640625, 0.13074111938476562, 0.13671112060546875, 0.14268112182617188, 0.148651123046875, 0.15462112426757812, 0.16059112548828125, 0.16656112670898438, 0.1725311279296875, 0.17850112915039062, 0.18447113037109375, 0.19044113159179688, 0.1964111328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 5.0, 11.0, 13.0, 20.0, 43.0, 163.0, 602.0, 8932.0, 4182179.0, 1957.0, 213.0, 61.0, 26.0, 10.0, 10.0, 8.0, 9.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85888671875, -0.8273544311523438, -0.7958221435546875, -0.7642898559570312, -0.732757568359375, -0.7012252807617188, -0.6696929931640625, -0.6381607055664062, -0.60662841796875, -0.5750961303710938, -0.5435638427734375, -0.5120315551757812, -0.480499267578125, -0.44896697998046875, -0.4174346923828125, -0.38590240478515625, -0.3543701171875, -0.32283782958984375, -0.2913055419921875, -0.25977325439453125, -0.228240966796875, -0.19670867919921875, -0.1651763916015625, -0.13364410400390625, -0.10211181640625, -0.07057952880859375, -0.0390472412109375, -0.00751495361328125, 0.024017333984375, 0.05554962158203125, 0.0870819091796875, 0.11861419677734375, 0.150146484375, 0.18167877197265625, 0.2132110595703125, 0.24474334716796875, 0.276275634765625, 0.30780792236328125, 0.3393402099609375, 0.37087249755859375, 0.40240478515625, 0.43393707275390625, 0.4654693603515625, 0.49700164794921875, 0.528533935546875, 0.5600662231445312, 0.5915985107421875, 0.6231307983398438, 0.6546630859375, 0.6861953735351562, 0.7177276611328125, 0.7492599487304688, 0.780792236328125, 0.8123245239257812, 0.8438568115234375, 0.8753890991210938, 0.90692138671875, 0.9384536743164062, 0.9699859619140625, 1.0015182495117188, 1.033050537109375, 1.0645828247070312, 1.0961151123046875, 1.1276473999023438, 1.1591796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 7.0, 9.0, 10.0, 38.0, 124.0, 3688.0, 122.0, 34.0, 16.0, 5.0, 9.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.25830078125, -0.2522239685058594, -0.24614715576171875, -0.24007034301757812, -0.2339935302734375, -0.22791671752929688, -0.22183990478515625, -0.21576309204101562, -0.209686279296875, -0.20360946655273438, -0.19753265380859375, -0.19145584106445312, -0.1853790283203125, -0.17930221557617188, -0.17322540283203125, -0.16714859008789062, -0.16107177734375, -0.15499496459960938, -0.14891815185546875, -0.14284133911132812, -0.1367645263671875, -0.13068771362304688, -0.12461090087890625, -0.11853408813476562, -0.112457275390625, -0.10638046264648438, -0.10030364990234375, -0.09422683715820312, -0.0881500244140625, -0.08207321166992188, -0.07599639892578125, -0.06991958618164062, -0.0638427734375, -0.057765960693359375, -0.05168914794921875, -0.045612335205078125, -0.0395355224609375, -0.033458709716796875, -0.02738189697265625, -0.021305084228515625, -0.015228271484375, -0.009151458740234375, -0.00307464599609375, 0.003002166748046875, 0.0090789794921875, 0.015155792236328125, 0.02123260498046875, 0.027309417724609375, 0.03338623046875, 0.039463043212890625, 0.04553985595703125, 0.051616668701171875, 0.0576934814453125, 0.06377029418945312, 0.06984710693359375, 0.07592391967773438, 0.082000732421875, 0.08807754516601562, 0.09415435791015625, 0.10023117065429688, 0.1063079833984375, 0.11238479614257812, 0.11846160888671875, 0.12453842163085938, 0.130615234375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 144.0, 871.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6258177757263184, -2.577258825302124, -2.528700113296509, -2.4801411628723145, -2.431582450866699, -2.383023500442505, -2.3344647884368896, -2.2859058380126953, -2.23734712600708, -2.1887881755828857, -2.1402294635772705, -2.091670513153076, -2.043111801147461, -1.9945529699325562, -1.9459941387176514, -1.897435188293457, -1.8488763570785522, -1.8003175258636475, -1.7517586946487427, -1.703199863433838, -1.654641032218933, -1.6060822010040283, -1.557523250579834, -1.5089645385742188, -1.4604055881500244, -1.4118467569351196, -1.3632879257202148, -1.31472909450531, -1.2661702632904053, -1.2176114320755005, -1.1690526008605957, -1.1204936504364014, -1.0719348192214966, -1.0233759880065918, -0.974817156791687, -0.9262583255767822, -0.8776994943618774, -0.8291406631469727, -0.7805817723274231, -0.7320229411125183, -0.6834641098976135, -0.6349052786827087, -0.586346447467804, -0.5377875566482544, -0.489228755235672, -0.4406699240207672, -0.39211106300354004, -0.34355223178863525, -0.29499340057373047, -0.24643456935882568, -0.1978757232427597, -0.14931687712669373, -0.10075804591178894, -0.052199214696884155, -0.0036403536796569824, 0.0449184775352478, 0.09347730875015259, 0.14203613996505737, 0.19059498608112335, 0.23915383219718933, 0.2877126634120941, 0.3362714946269989, 0.3848303556442261, 0.43338918685913086, 0.48194801807403564]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 5.0, 8.0, 9.0, 20.0, 21.0, 37.0, 28.0, 41.0, 49.0, 54.0, 55.0, 66.0, 57.0, 60.0, 61.0, 68.0, 56.0, 65.0, 50.0, 45.0, 34.0, 27.0, 26.0, 14.0, 15.0, 10.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33708566427230835, -0.32614633440971375, -0.31520700454711914, -0.30426767468452454, -0.29332834482192993, -0.2823890149593353, -0.2714496850967407, -0.2605103552341461, -0.2495710253715515, -0.2386316955089569, -0.2276923656463623, -0.2167530357837677, -0.2058137059211731, -0.1948743760585785, -0.1839350461959839, -0.17299571633338928, -0.16205638647079468, -0.15111705660820007, -0.14017772674560547, -0.12923839688301086, -0.11829906702041626, -0.10735973715782166, -0.09642040729522705, -0.08548107743263245, -0.07454174757003784, -0.06360241770744324, -0.05266308784484863, -0.04172375798225403, -0.030784428119659424, -0.01984509825706482, -0.008905768394470215, 0.0020335614681243896, 0.012972891330718994, 0.0239122211933136, 0.0348515510559082, 0.04579088091850281, 0.05673021078109741, 0.06766954064369202, 0.07860887050628662, 0.08954820036888123, 0.10048753023147583, 0.11142686009407043, 0.12236618995666504, 0.13330551981925964, 0.14424484968185425, 0.15518417954444885, 0.16612350940704346, 0.17706283926963806, 0.18800216913223267, 0.19894149899482727, 0.20988082885742188, 0.22082015872001648, 0.23175948858261108, 0.2426988184452057, 0.2536381483078003, 0.2645774781703949, 0.2755168080329895, 0.2864561378955841, 0.2973954677581787, 0.3083347976207733, 0.3192741274833679, 0.3302134573459625, 0.34115278720855713, 0.35209211707115173, 0.36303144693374634]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 4.0, 7.0, 9.0, 8.0, 8.0, 22.0, 17.0, 19.0, 38.0, 39.0, 57.0, 87.0, 107.0, 114.0, 198.0, 250.0, 346.0, 443.0, 625.0, 797.0, 1073.0, 1620.0, 2318.0, 3527.0, 5740.0, 10024.0, 22383.0, 241004.0, 701982.0, 26178.0, 10901.0, 6142.0, 3777.0, 2552.0, 1658.0, 1175.0, 814.0, 576.0, 480.0, 378.0, 237.0, 194.0, 142.0, 97.0, 85.0, 56.0, 61.0, 40.0, 31.0, 30.0, 21.0, 15.0, 10.0, 13.0, 10.0, 9.0, 7.0, 1.0, 3.0, 4.0, 3.0], "bins": [-0.2198486328125, -0.21277427673339844, -0.20569992065429688, -0.1986255645751953, -0.19155120849609375, -0.1844768524169922, -0.17740249633789062, -0.17032814025878906, -0.1632537841796875, -0.15617942810058594, -0.14910507202148438, -0.1420307159423828, -0.13495635986328125, -0.1278820037841797, -0.12080764770507812, -0.11373329162597656, -0.106658935546875, -0.09958457946777344, -0.09251022338867188, -0.08543586730957031, -0.07836151123046875, -0.07128715515136719, -0.06421279907226562, -0.05713844299316406, -0.0500640869140625, -0.04298973083496094, -0.035915374755859375, -0.028841018676757812, -0.02176666259765625, -0.014692306518554688, -0.007617950439453125, -0.0005435943603515625, 0.00653076171875, 0.013605117797851562, 0.020679473876953125, 0.027753829956054688, 0.03482818603515625, 0.04190254211425781, 0.048976898193359375, 0.05605125427246094, 0.0631256103515625, 0.07019996643066406, 0.07727432250976562, 0.08434867858886719, 0.09142303466796875, 0.09849739074707031, 0.10557174682617188, 0.11264610290527344, 0.119720458984375, 0.12679481506347656, 0.13386917114257812, 0.1409435272216797, 0.14801788330078125, 0.1550922393798828, 0.16216659545898438, 0.16924095153808594, 0.1763153076171875, 0.18338966369628906, 0.19046401977539062, 0.1975383758544922, 0.20461273193359375, 0.2116870880126953, 0.21876144409179688, 0.22583580017089844, 0.23291015625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 11.0, 3.0, 5.0, 7.0, 6.0, 7.0, 4.0, 13.0, 10.0, 39.0, 164.0, 341.0, 235.0, 50.0, 16.0, 9.0, 3.0, 7.0, 7.0, 8.0, 5.0, 3.0, 5.0, 8.0, 3.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1854248046875, -0.1794605255126953, -0.17349624633789062, -0.16753196716308594, -0.16156768798828125, -0.15560340881347656, -0.14963912963867188, -0.1436748504638672, -0.1377105712890625, -0.1317462921142578, -0.12578201293945312, -0.11981773376464844, -0.11385345458984375, -0.10788917541503906, -0.10192489624023438, -0.09596061706542969, -0.089996337890625, -0.08403205871582031, -0.07806777954101562, -0.07210350036621094, -0.06613922119140625, -0.06017494201660156, -0.054210662841796875, -0.04824638366699219, -0.0422821044921875, -0.03631782531738281, -0.030353546142578125, -0.024389266967773438, -0.01842498779296875, -0.012460708618164062, -0.006496429443359375, -0.0005321502685546875, 0.00543212890625, 0.011396408081054688, 0.017360687255859375, 0.023324966430664062, 0.02928924560546875, 0.03525352478027344, 0.041217803955078125, 0.04718208312988281, 0.0531463623046875, 0.05911064147949219, 0.06507492065429688, 0.07103919982910156, 0.07700347900390625, 0.08296775817871094, 0.08893203735351562, 0.09489631652832031, 0.100860595703125, 0.10682487487792969, 0.11278915405273438, 0.11875343322753906, 0.12471771240234375, 0.13068199157714844, 0.13664627075195312, 0.1426105499267578, 0.1485748291015625, 0.1545391082763672, 0.16050338745117188, 0.16646766662597656, 0.17243194580078125, 0.17839622497558594, 0.18436050415039062, 0.1903247833251953, 0.1962890625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 3.0, 6.0, 9.0, 10.0, 21.0, 19.0, 16.0, 21.0, 27.0, 36.0, 45.0, 49.0, 73.0, 76.0, 86.0, 106.0, 169.0, 225.0, 394.0, 630.0, 1302.0, 5076.0, 272182.0, 756533.0, 7782.0, 1498.0, 713.0, 391.0, 251.0, 157.0, 110.0, 89.0, 84.0, 66.0, 45.0, 45.0, 37.0, 27.0, 32.0, 26.0, 11.0, 17.0, 14.0, 9.0, 13.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.72802734375, -0.7053298950195312, -0.6826324462890625, -0.6599349975585938, -0.637237548828125, -0.6145401000976562, -0.5918426513671875, -0.5691452026367188, -0.54644775390625, -0.5237503051757812, -0.5010528564453125, -0.47835540771484375, -0.455657958984375, -0.43296051025390625, -0.4102630615234375, -0.38756561279296875, -0.3648681640625, -0.34217071533203125, -0.3194732666015625, -0.29677581787109375, -0.274078369140625, -0.25138092041015625, -0.2286834716796875, -0.20598602294921875, -0.18328857421875, -0.16059112548828125, -0.1378936767578125, -0.11519622802734375, -0.092498779296875, -0.06980133056640625, -0.0471038818359375, -0.02440643310546875, -0.001708984375, 0.02098846435546875, 0.0436859130859375, 0.06638336181640625, 0.089080810546875, 0.11177825927734375, 0.1344757080078125, 0.15717315673828125, 0.17987060546875, 0.20256805419921875, 0.2252655029296875, 0.24796295166015625, 0.270660400390625, 0.29335784912109375, 0.3160552978515625, 0.33875274658203125, 0.3614501953125, 0.38414764404296875, 0.4068450927734375, 0.42954254150390625, 0.452239990234375, 0.47493743896484375, 0.4976348876953125, 0.5203323364257812, 0.54302978515625, 0.5657272338867188, 0.5884246826171875, 0.6111221313476562, 0.633819580078125, 0.6565170288085938, 0.6792144775390625, 0.7019119262695312, 0.724609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 3.0, 8.0, 5.0, 11.0, 9.0, 7.0, 11.0, 11.0, 16.0, 21.0, 18.0, 32.0, 24.0, 25.0, 25.0, 28.0, 28.0, 38.0, 37.0, 45.0, 34.0, 45.0, 41.0, 37.0, 40.0, 35.0, 37.0, 40.0, 26.0, 34.0, 32.0, 33.0, 24.0, 17.0, 22.0, 16.0, 11.0, 15.0, 14.0, 4.0, 10.0, 7.0, 7.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.48828125, -0.4730644226074219, -0.45784759521484375, -0.4426307678222656, -0.4274139404296875, -0.4121971130371094, -0.39698028564453125, -0.3817634582519531, -0.366546630859375, -0.3513298034667969, -0.33611297607421875, -0.3208961486816406, -0.3056793212890625, -0.2904624938964844, -0.27524566650390625, -0.2600288391113281, -0.24481201171875, -0.22959518432617188, -0.21437835693359375, -0.19916152954101562, -0.1839447021484375, -0.16872787475585938, -0.15351104736328125, -0.13829421997070312, -0.123077392578125, -0.10786056518554688, -0.09264373779296875, -0.07742691040039062, -0.0622100830078125, -0.046993255615234375, -0.03177642822265625, -0.016559600830078125, -0.0013427734375, 0.013874053955078125, 0.02909088134765625, 0.044307708740234375, 0.0595245361328125, 0.07474136352539062, 0.08995819091796875, 0.10517501831054688, 0.120391845703125, 0.13560867309570312, 0.15082550048828125, 0.16604232788085938, 0.1812591552734375, 0.19647598266601562, 0.21169281005859375, 0.22690963745117188, 0.24212646484375, 0.2573432922363281, 0.27256011962890625, 0.2877769470214844, 0.3029937744140625, 0.3182106018066406, 0.33342742919921875, 0.3486442565917969, 0.363861083984375, 0.3790779113769531, 0.39429473876953125, 0.4095115661621094, 0.4247283935546875, 0.4399452209472656, 0.45516204833984375, 0.4703788757324219, 0.485595703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 9.0, 9.0, 6.0, 15.0, 15.0, 23.0, 21.0, 32.0, 59.0, 114.0, 176.0, 374.0, 1049.0, 5185.0, 106592.0, 921763.0, 10299.0, 1725.0, 549.0, 185.0, 130.0, 65.0, 54.0, 27.0, 19.0, 16.0, 7.0, 11.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008306503295898438, -0.0008039921522140503, -0.0007773339748382568, -0.0007506757974624634, -0.0007240176200866699, -0.0006973594427108765, -0.000670701265335083, -0.0006440430879592896, -0.0006173849105834961, -0.0005907267332077026, -0.0005640685558319092, -0.0005374103784561157, -0.0005107522010803223, -0.0004840940237045288, -0.00045743584632873535, -0.0004307776689529419, -0.00040411949157714844, -0.000377461314201355, -0.0003508031368255615, -0.00032414495944976807, -0.0002974867820739746, -0.00027082860469818115, -0.0002441704273223877, -0.00021751224994659424, -0.00019085407257080078, -0.00016419589519500732, -0.00013753771781921387, -0.00011087954044342041, -8.422136306762695e-05, -5.7563185691833496e-05, -3.090500831604004e-05, -4.246830940246582e-06, 2.2411346435546875e-05, 4.906952381134033e-05, 7.572770118713379e-05, 0.00010238587856292725, 0.0001290440559387207, 0.00015570223331451416, 0.00018236041069030762, 0.00020901858806610107, 0.00023567676544189453, 0.000262334942817688, 0.00028899312019348145, 0.0003156512975692749, 0.00034230947494506836, 0.0003689676523208618, 0.0003956258296966553, 0.00042228400707244873, 0.0004489421844482422, 0.00047560036182403564, 0.0005022585391998291, 0.0005289167165756226, 0.000555574893951416, 0.0005822330713272095, 0.0006088912487030029, 0.0006355494260787964, 0.0006622076034545898, 0.0006888657808303833, 0.0007155239582061768, 0.0007421821355819702, 0.0007688403129577637, 0.0007954984903335571, 0.0008221566677093506, 0.000848814845085144, 0.0008754730224609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 0.0, 5.0, 1.0, 6.0, 7.0, 7.0, 22.0, 14.0, 19.0, 13.0, 34.0, 12.0, 23.0, 45.0, 23.0, 53.0, 30.0, 37.0, 80.0, 33.0, 67.0, 30.0, 82.0, 36.0, 27.0, 63.0, 35.0, 44.0, 23.0, 30.0, 17.0, 15.0, 22.0, 9.0, 12.0, 5.0, 4.0, 4.0, 4.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4437904357910156e-06, -2.359040081501007e-06, -2.2742897272109985e-06, -2.18953937292099e-06, -2.1047890186309814e-06, -2.020038664340973e-06, -1.9352883100509644e-06, -1.8505379557609558e-06, -1.7657876014709473e-06, -1.6810372471809387e-06, -1.5962868928909302e-06, -1.5115365386009216e-06, -1.426786184310913e-06, -1.3420358300209045e-06, -1.257285475730896e-06, -1.1725351214408875e-06, -1.087784767150879e-06, -1.0030344128608704e-06, -9.182840585708618e-07, -8.335337042808533e-07, -7.487833499908447e-07, -6.640329957008362e-07, -5.792826414108276e-07, -4.945322871208191e-07, -4.0978193283081055e-07, -3.25031578540802e-07, -2.4028122425079346e-07, -1.555308699607849e-07, -7.078051567077637e-08, 1.3969838619232178e-08, 9.872019290924072e-08, 1.8347054719924927e-07, 2.682209014892578e-07, 3.5297125577926636e-07, 4.377216100692749e-07, 5.224719643592834e-07, 6.07222318649292e-07, 6.919726729393005e-07, 7.767230272293091e-07, 8.614733815193176e-07, 9.462237358093262e-07, 1.0309740900993347e-06, 1.1157244443893433e-06, 1.2004747986793518e-06, 1.2852251529693604e-06, 1.369975507259369e-06, 1.4547258615493774e-06, 1.539476215839386e-06, 1.6242265701293945e-06, 1.708976924419403e-06, 1.7937272787094116e-06, 1.8784776329994202e-06, 1.9632279872894287e-06, 2.0479783415794373e-06, 2.132728695869446e-06, 2.2174790501594543e-06, 2.302229404449463e-06, 2.3869797587394714e-06, 2.47173011302948e-06, 2.5564804673194885e-06, 2.641230821609497e-06, 2.7259811758995056e-06, 2.810731530189514e-06, 2.8954818844795227e-06, 2.9802322387695312e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 6.0, 11.0, 9.0, 23.0, 23.0, 32.0, 55.0, 87.0, 158.0, 426.0, 2013.0, 968214.0, 75401.0, 1323.0, 350.0, 142.0, 84.0, 48.0, 32.0, 23.0, 23.0, 9.0, 10.0, 4.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.001434326171875, -0.0013863742351531982, -0.0013384222984313965, -0.0012904703617095947, -0.001242518424987793, -0.0011945664882659912, -0.0011466145515441895, -0.0010986626148223877, -0.001050710678100586, -0.0010027587413787842, -0.0009548068046569824, -0.0009068548679351807, -0.0008589029312133789, -0.0008109509944915771, -0.0007629990577697754, -0.0007150471210479736, -0.0006670951843261719, -0.0006191432476043701, -0.0005711913108825684, -0.0005232393741607666, -0.00047528743743896484, -0.0004273355007171631, -0.00037938356399536133, -0.00033143162727355957, -0.0002834796905517578, -0.00023552775382995605, -0.0001875758171081543, -0.00013962388038635254, -9.167194366455078e-05, -4.3720006942749023e-05, 4.231929779052734e-06, 5.218386650085449e-05, 0.00010013580322265625, 0.000148087739944458, 0.00019603967666625977, 0.00024399161338806152, 0.0002919435501098633, 0.00033989548683166504, 0.0003878474235534668, 0.00043579936027526855, 0.0004837512969970703, 0.0005317032337188721, 0.0005796551704406738, 0.0006276071071624756, 0.0006755590438842773, 0.0007235109806060791, 0.0007714629173278809, 0.0008194148540496826, 0.0008673667907714844, 0.0009153187274932861, 0.0009632706642150879, 0.0010112226009368896, 0.0010591745376586914, 0.0011071264743804932, 0.001155078411102295, 0.0012030303478240967, 0.0012509822845458984, 0.0012989342212677002, 0.001346886157989502, 0.0013948380947113037, 0.0014427900314331055, 0.0014907419681549072, 0.001538693904876709, 0.0015866458415985107, 0.0016345977783203125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 8.0, 6.0, 7.0, 7.0, 5.0, 13.0, 16.0, 24.0, 23.0, 48.0, 126.0, 174.0, 199.0, 126.0, 86.0, 50.0, 19.0, 16.0, 13.0, 7.0, 4.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0007562637329101562, -0.0007273107767105103, -0.0006983578205108643, -0.0006694048643112183, -0.0006404519081115723, -0.0006114989519119263, -0.0005825459957122803, -0.0005535930395126343, -0.0005246400833129883, -0.0004956871271133423, -0.0004667341709136963, -0.0004377812147140503, -0.0004088282585144043, -0.0003798753023147583, -0.0003509223461151123, -0.0003219693899154663, -0.0002930164337158203, -0.0002640634775161743, -0.00023511052131652832, -0.00020615756511688232, -0.00017720460891723633, -0.00014825165271759033, -0.00011929869651794434, -9.034574031829834e-05, -6.139278411865234e-05, -3.243982791900635e-05, -3.4868717193603516e-06, 2.5466084480285645e-05, 5.441904067993164e-05, 8.337199687957764e-05, 0.00011232495307922363, 0.00014127790927886963, 0.00017023086547851562, 0.00019918382167816162, 0.00022813677787780762, 0.0002570897340774536, 0.0002860426902770996, 0.0003149956464767456, 0.0003439486026763916, 0.0003729015588760376, 0.0004018545150756836, 0.0004308074712753296, 0.0004597604274749756, 0.0004887133836746216, 0.0005176663398742676, 0.0005466192960739136, 0.0005755722522735596, 0.0006045252084732056, 0.0006334781646728516, 0.0006624311208724976, 0.0006913840770721436, 0.0007203370332717896, 0.0007492899894714355, 0.0007782429456710815, 0.0008071959018707275, 0.0008361488580703735, 0.0008651018142700195, 0.0008940547704696655, 0.0009230077266693115, 0.0009519606828689575, 0.0009809136390686035, 0.0010098665952682495, 0.0010388195514678955, 0.0010677725076675415, 0.0010967254638671875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 97.0, 896.0, 16.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.209573268890381, -6.979009628295898, -6.748445987701416, -6.517882347106934, -6.287319183349609, -6.056755065917969, -5.8261919021606445, -5.595628261566162, -5.36506462097168, -5.134500980377197, -4.903937339782715, -4.673373699188232, -4.44281005859375, -4.212246894836426, -3.9816832542419434, -3.751119613647461, -3.5205559730529785, -3.289992332458496, -3.0594286918640137, -2.8288652896881104, -2.598301649093628, -2.3677380084991455, -2.137174606323242, -1.9066109657287598, -1.6760473251342773, -1.445483684539795, -1.214920163154602, -0.9843565821647644, -0.7537930011749268, -0.5232293605804443, -0.29266583919525146, -0.062102317810058594, 0.16846179962158203, 0.3990253806114197, 0.6295889616012573, 0.860152542591095, 1.0907161235809326, 1.321279764175415, 1.551843285560608, 1.7824068069458008, 2.012970447540283, 2.2435340881347656, 2.474097728729248, 2.7046611309051514, 2.935224771499634, 3.165788412094116, 3.3963518142700195, 3.626915454864502, 3.8574790954589844, 4.088042736053467, 4.318606376647949, 4.549170017242432, 4.779733657836914, 5.010296821594238, 5.240860462188721, 5.471424102783203, 5.7019877433776855, 5.932551383972168, 6.16311502456665, 6.393678665161133, 6.624241828918457, 6.854805946350098, 7.085369110107422, 7.315932750701904, 7.546496391296387]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 5.0, 1.0, 2.0, 8.0, 5.0, 12.0, 18.0, 21.0, 22.0, 26.0, 30.0, 38.0, 42.0, 50.0, 51.0, 59.0, 62.0, 68.0, 59.0, 67.0, 52.0, 46.0, 49.0, 35.0, 33.0, 26.0, 26.0, 15.0, 19.0, 11.0, 12.0, 6.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-5.097583770751953, -4.9691996574401855, -4.840816020965576, -4.712431907653809, -4.584048271179199, -4.455664157867432, -4.327280044555664, -4.198896408081055, -4.070512294769287, -3.9421284198760986, -3.81374454498291, -3.6853604316711426, -3.556976556777954, -3.4285926818847656, -3.300208568572998, -3.1718246936798096, -3.043440818786621, -2.9150569438934326, -2.786673069000244, -2.6582889556884766, -2.529905080795288, -2.4015212059020996, -2.273137092590332, -2.1447532176971436, -2.016369342803955, -1.8879854679107666, -1.7596014738082886, -1.6312174797058105, -1.502833604812622, -1.3744497299194336, -1.2460657358169556, -1.1176817417144775, -0.9892981052398682, -0.8609141707420349, -0.7325302362442017, -0.6041463017463684, -0.47576236724853516, -0.3473784327507019, -0.21899449825286865, -0.0906105637550354, 0.03777337074279785, 0.1661573052406311, 0.29454123973846436, 0.4229251742362976, 0.5513091087341309, 0.6796930432319641, 0.8080769777297974, 0.9364609122276306, 1.0648448467254639, 1.1932287216186523, 1.3216127157211304, 1.4499967098236084, 1.5783805847167969, 1.7067644596099854, 1.8351484537124634, 1.9635324478149414, 2.09191632270813, 2.2203001976013184, 2.348684310913086, 2.4770681858062744, 2.605452060699463, 2.7338359355926514, 2.86221981048584, 2.9906039237976074, 3.118987798690796]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 3.0, 4.0, 9.0, 9.0, 13.0, 18.0, 13.0, 27.0, 24.0, 58.0, 58.0, 98.0, 117.0, 200.0, 408.0, 12832.0, 593883.0, 3579028.0, 6100.0, 401.0, 244.0, 172.0, 108.0, 109.0, 76.0, 45.0, 38.0, 26.0, 30.0, 14.0, 26.0, 21.0, 13.0, 10.0, 9.0, 5.0, 5.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.548828125, -0.5311279296875, -0.513427734375, -0.4957275390625, -0.47802734375, -0.4603271484375, -0.442626953125, -0.4249267578125, -0.4072265625, -0.3895263671875, -0.371826171875, -0.3541259765625, -0.33642578125, -0.3187255859375, -0.301025390625, -0.2833251953125, -0.265625, -0.2479248046875, -0.230224609375, -0.2125244140625, -0.19482421875, -0.1771240234375, -0.159423828125, -0.1417236328125, -0.1240234375, -0.1063232421875, -0.088623046875, -0.0709228515625, -0.05322265625, -0.0355224609375, -0.017822265625, -0.0001220703125, 0.017578125, 0.0352783203125, 0.052978515625, 0.0706787109375, 0.08837890625, 0.1060791015625, 0.123779296875, 0.1414794921875, 0.1591796875, 0.1768798828125, 0.194580078125, 0.2122802734375, 0.22998046875, 0.2476806640625, 0.265380859375, 0.2830810546875, 0.30078125, 0.3184814453125, 0.336181640625, 0.3538818359375, 0.37158203125, 0.3892822265625, 0.406982421875, 0.4246826171875, 0.4423828125, 0.4600830078125, 0.477783203125, 0.4954833984375, 0.51318359375, 0.5308837890625, 0.548583984375, 0.5662841796875, 0.583984375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 10.0, 3.0, 4.0, 6.0, 7.0, 11.0, 5.0, 7.0, 16.0, 53.0, 185.0, 325.0, 211.0, 50.0, 14.0, 10.0, 5.0, 6.0, 8.0, 7.0, 5.0, 4.0, 6.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.179931640625, -0.17412948608398438, -0.16832733154296875, -0.16252517700195312, -0.1567230224609375, -0.15092086791992188, -0.14511871337890625, -0.13931655883789062, -0.133514404296875, -0.12771224975585938, -0.12191009521484375, -0.11610794067382812, -0.1103057861328125, -0.10450363159179688, -0.09870147705078125, -0.09289932250976562, -0.08709716796875, -0.08129501342773438, -0.07549285888671875, -0.06969070434570312, -0.0638885498046875, -0.058086395263671875, -0.05228424072265625, -0.046482086181640625, -0.040679931640625, -0.034877777099609375, -0.02907562255859375, -0.023273468017578125, -0.0174713134765625, -0.011669158935546875, -0.00586700439453125, -6.4849853515625e-05, 0.0057373046875, 0.011539459228515625, 0.01734161376953125, 0.023143768310546875, 0.0289459228515625, 0.034748077392578125, 0.04055023193359375, 0.046352386474609375, 0.052154541015625, 0.057956695556640625, 0.06375885009765625, 0.06956100463867188, 0.0753631591796875, 0.08116531372070312, 0.08696746826171875, 0.09276962280273438, 0.09857177734375, 0.10437393188476562, 0.11017608642578125, 0.11597824096679688, 0.1217803955078125, 0.12758255004882812, 0.13338470458984375, 0.13918685913085938, 0.144989013671875, 0.15079116821289062, 0.15659332275390625, 0.16239547729492188, 0.1681976318359375, 0.17399978637695312, 0.17980194091796875, 0.18560409545898438, 0.19140625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 9.0, 0.0, 5.0, 1.0, 6.0, 12.0, 15.0, 31.0, 36.0, 49.0, 96.0, 346.0, 1587.0, 88982.0, 4099785.0, 2624.0, 399.0, 131.0, 48.0, 42.0, 24.0, 17.0, 14.0, 4.0, 5.0, 0.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9248046875, -0.8959732055664062, -0.8671417236328125, -0.8383102416992188, -0.809478759765625, -0.7806472778320312, -0.7518157958984375, -0.7229843139648438, -0.69415283203125, -0.6653213500976562, -0.6364898681640625, -0.6076583862304688, -0.578826904296875, -0.5499954223632812, -0.5211639404296875, -0.49233245849609375, -0.4635009765625, -0.43466949462890625, -0.4058380126953125, -0.37700653076171875, -0.348175048828125, -0.31934356689453125, -0.2905120849609375, -0.26168060302734375, -0.23284912109375, -0.20401763916015625, -0.1751861572265625, -0.14635467529296875, -0.117523193359375, -0.08869171142578125, -0.0598602294921875, -0.03102874755859375, -0.002197265625, 0.02663421630859375, 0.0554656982421875, 0.08429718017578125, 0.113128662109375, 0.14196014404296875, 0.1707916259765625, 0.19962310791015625, 0.22845458984375, 0.25728607177734375, 0.2861175537109375, 0.31494903564453125, 0.343780517578125, 0.37261199951171875, 0.4014434814453125, 0.43027496337890625, 0.4591064453125, 0.48793792724609375, 0.5167694091796875, 0.5456008911132812, 0.574432373046875, 0.6032638549804688, 0.6320953369140625, 0.6609268188476562, 0.68975830078125, 0.7185897827148438, 0.7474212646484375, 0.7762527465820312, 0.805084228515625, 0.8339157104492188, 0.8627471923828125, 0.8915786743164062, 0.92041015625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 13.0, 42.0, 204.0, 2353.0, 1172.0, 187.0, 42.0, 13.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3212890625, -0.31122589111328125, -0.3011627197265625, -0.29109954833984375, -0.281036376953125, -0.27097320556640625, -0.2609100341796875, -0.25084686279296875, -0.24078369140625, -0.23072052001953125, -0.2206573486328125, -0.21059417724609375, -0.200531005859375, -0.19046783447265625, -0.1804046630859375, -0.17034149169921875, -0.1602783203125, -0.15021514892578125, -0.1401519775390625, -0.13008880615234375, -0.120025634765625, -0.10996246337890625, -0.0998992919921875, -0.08983612060546875, -0.07977294921875, -0.06970977783203125, -0.0596466064453125, -0.04958343505859375, -0.039520263671875, -0.02945709228515625, -0.0193939208984375, -0.00933074951171875, 0.000732421875, 0.01079559326171875, 0.0208587646484375, 0.03092193603515625, 0.040985107421875, 0.05104827880859375, 0.0611114501953125, 0.07117462158203125, 0.08123779296875, 0.09130096435546875, 0.1013641357421875, 0.11142730712890625, 0.121490478515625, 0.13155364990234375, 0.1416168212890625, 0.15167999267578125, 0.1617431640625, 0.17180633544921875, 0.1818695068359375, 0.19193267822265625, 0.201995849609375, 0.21205902099609375, 0.2221221923828125, 0.23218536376953125, 0.24224853515625, 0.25231170654296875, 0.2623748779296875, 0.27243804931640625, 0.282501220703125, 0.29256439208984375, 0.3026275634765625, 0.31269073486328125, 0.32275390625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 991.0, 21.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5510613918304443, -1.4633548259735107, -1.3756483793258667, -1.2879419326782227, -1.200235366821289, -1.1125288009643555, -1.0248223543167114, -0.9371158480644226, -0.8494093418121338, -0.761702835559845, -0.6739963293075562, -0.5862898230552673, -0.4985833168029785, -0.4108768105506897, -0.3231703042984009, -0.23546379804611206, -0.14775729179382324, -0.060050785541534424, 0.027655720710754395, 0.11536222696304321, 0.20306873321533203, 0.29077523946762085, 0.37848174571990967, 0.4661882519721985, 0.5538947582244873, 0.6416012644767761, 0.7293077707290649, 0.8170142769813538, 0.9047207832336426, 0.9924272894859314, 1.0801337957382202, 1.1678402423858643, 1.2555465698242188, 1.3432531356811523, 1.4309595823287964, 1.5186660289764404, 1.606372594833374, 1.6940791606903076, 1.7817856073379517, 1.8694920539855957, 1.9571986198425293, 2.044905185699463, 2.1326117515563965, 2.220318078994751, 2.3080246448516846, 2.395731210708618, 2.4834375381469727, 2.5711441040039062, 2.65885066986084, 2.7465572357177734, 2.834263801574707, 2.9219701290130615, 3.009676694869995, 3.0973832607269287, 3.185089588165283, 3.272796154022217, 3.3605027198791504, 3.448209285736084, 3.5359158515930176, 3.623622179031372, 3.7113287448883057, 3.7990353107452393, 3.8867416381835938, 3.9744482040405273, 4.062154769897461]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 4.0, 3.0, 9.0, 12.0, 14.0, 16.0, 26.0, 32.0, 29.0, 53.0, 56.0, 57.0, 53.0, 51.0, 66.0, 50.0, 63.0, 57.0, 45.0, 61.0, 37.0, 43.0, 28.0, 30.0, 15.0, 30.0, 14.0, 9.0, 11.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5997762084007263, -0.5801371335983276, -0.560498058795929, -0.5408589839935303, -0.5212199091911316, -0.5015808343887329, -0.48194175958633423, -0.46230268478393555, -0.44266360998153687, -0.4230245351791382, -0.4033854603767395, -0.3837463855743408, -0.36410731077194214, -0.34446823596954346, -0.3248291611671448, -0.3051900863647461, -0.2855510115623474, -0.26591193675994873, -0.24627286195755005, -0.22663378715515137, -0.20699471235275269, -0.187355637550354, -0.16771656274795532, -0.14807748794555664, -0.12843841314315796, -0.10879933834075928, -0.0891602635383606, -0.06952118873596191, -0.04988211393356323, -0.03024303913116455, -0.01060396432876587, 0.009035110473632812, 0.028674185276031494, 0.048313260078430176, 0.06795233488082886, 0.08759140968322754, 0.10723048448562622, 0.1268695592880249, 0.14650863409042358, 0.16614770889282227, 0.18578678369522095, 0.20542585849761963, 0.2250649333000183, 0.244704008102417, 0.2643430829048157, 0.28398215770721436, 0.30362123250961304, 0.3232603073120117, 0.3428993821144104, 0.3625384569168091, 0.38217753171920776, 0.40181660652160645, 0.4214556813240051, 0.4410947561264038, 0.4607338309288025, 0.48037290573120117, 0.5000119805335999, 0.5196510553359985, 0.5392901301383972, 0.5589292049407959, 0.5785682797431946, 0.5982073545455933, 0.6178464293479919, 0.6374855041503906, 0.6571245789527893]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 11.0, 13.0, 10.0, 19.0, 20.0, 24.0, 36.0, 46.0, 62.0, 68.0, 95.0, 156.0, 188.0, 285.0, 441.0, 573.0, 794.0, 1119.0, 1587.0, 2367.0, 3650.0, 6093.0, 10891.0, 24546.0, 565315.0, 378814.0, 23407.0, 10398.0, 6001.0, 3582.0, 2397.0, 1605.0, 1073.0, 857.0, 572.0, 401.0, 291.0, 199.0, 159.0, 103.0, 80.0, 50.0, 36.0, 29.0, 28.0, 18.0, 11.0, 11.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.2257080078125, -0.21886444091796875, -0.2120208740234375, -0.20517730712890625, -0.198333740234375, -0.19149017333984375, -0.1846466064453125, -0.17780303955078125, -0.17095947265625, -0.16411590576171875, -0.1572723388671875, -0.15042877197265625, -0.143585205078125, -0.13674163818359375, -0.1298980712890625, -0.12305450439453125, -0.1162109375, -0.10936737060546875, -0.1025238037109375, -0.09568023681640625, -0.088836669921875, -0.08199310302734375, -0.0751495361328125, -0.06830596923828125, -0.06146240234375, -0.05461883544921875, -0.0477752685546875, -0.04093170166015625, -0.034088134765625, -0.02724456787109375, -0.0204010009765625, -0.01355743408203125, -0.0067138671875, 0.00012969970703125, 0.0069732666015625, 0.01381683349609375, 0.020660400390625, 0.02750396728515625, 0.0343475341796875, 0.04119110107421875, 0.04803466796875, 0.05487823486328125, 0.0617218017578125, 0.06856536865234375, 0.075408935546875, 0.08225250244140625, 0.0890960693359375, 0.09593963623046875, 0.102783203125, 0.10962677001953125, 0.1164703369140625, 0.12331390380859375, 0.130157470703125, 0.13700103759765625, 0.1438446044921875, 0.15068817138671875, 0.15753173828125, 0.16437530517578125, 0.1712188720703125, 0.17806243896484375, 0.184906005859375, 0.19174957275390625, 0.1985931396484375, 0.20543670654296875, 0.2122802734375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 8.0, 4.0, 4.0, 7.0, 6.0, 9.0, 6.0, 7.0, 17.0, 54.0, 191.0, 318.0, 213.0, 47.0, 15.0, 9.0, 6.0, 6.0, 8.0, 7.0, 5.0, 4.0, 6.0, 6.0, 2.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1800537109375, -0.17424583435058594, -0.16843795776367188, -0.1626300811767578, -0.15682220458984375, -0.1510143280029297, -0.14520645141601562, -0.13939857482910156, -0.1335906982421875, -0.12778282165527344, -0.12197494506835938, -0.11616706848144531, -0.11035919189453125, -0.10455131530761719, -0.09874343872070312, -0.09293556213378906, -0.087127685546875, -0.08131980895996094, -0.07551193237304688, -0.06970405578613281, -0.06389617919921875, -0.05808830261230469, -0.052280426025390625, -0.04647254943847656, -0.0406646728515625, -0.03485679626464844, -0.029048919677734375, -0.023241043090820312, -0.01743316650390625, -0.011625289916992188, -0.005817413330078125, -9.5367431640625e-06, 0.00579833984375, 0.011606216430664062, 0.017414093017578125, 0.023221969604492188, 0.02902984619140625, 0.03483772277832031, 0.040645599365234375, 0.04645347595214844, 0.0522613525390625, 0.05806922912597656, 0.06387710571289062, 0.06968498229980469, 0.07549285888671875, 0.08130073547363281, 0.08710861206054688, 0.09291648864746094, 0.098724365234375, 0.10453224182128906, 0.11034011840820312, 0.11614799499511719, 0.12195587158203125, 0.1277637481689453, 0.13357162475585938, 0.13937950134277344, 0.1451873779296875, 0.15099525451660156, 0.15680313110351562, 0.1626110076904297, 0.16841888427734375, 0.1742267608642578, 0.18003463745117188, 0.18584251403808594, 0.191650390625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 8.0, 15.0, 10.0, 15.0, 24.0, 27.0, 47.0, 48.0, 37.0, 49.0, 69.0, 89.0, 102.0, 119.0, 186.0, 277.0, 476.0, 884.0, 2997.0, 89832.0, 939685.0, 10234.0, 1347.0, 585.0, 386.0, 231.0, 161.0, 117.0, 76.0, 75.0, 60.0, 35.0, 45.0, 47.0, 33.0, 26.0, 20.0, 13.0, 13.0, 7.0, 9.0, 9.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6767578125, -0.6551055908203125, -0.633453369140625, -0.6118011474609375, -0.59014892578125, -0.5684967041015625, -0.546844482421875, -0.5251922607421875, -0.5035400390625, -0.4818878173828125, -0.460235595703125, -0.4385833740234375, -0.41693115234375, -0.3952789306640625, -0.373626708984375, -0.3519744873046875, -0.330322265625, -0.3086700439453125, -0.287017822265625, -0.2653656005859375, -0.24371337890625, -0.2220611572265625, -0.200408935546875, -0.1787567138671875, -0.1571044921875, -0.1354522705078125, -0.113800048828125, -0.0921478271484375, -0.07049560546875, -0.0488433837890625, -0.027191162109375, -0.0055389404296875, 0.01611328125, 0.0377655029296875, 0.059417724609375, 0.0810699462890625, 0.10272216796875, 0.1243743896484375, 0.146026611328125, 0.1676788330078125, 0.1893310546875, 0.2109832763671875, 0.232635498046875, 0.2542877197265625, 0.27593994140625, 0.2975921630859375, 0.319244384765625, 0.3408966064453125, 0.362548828125, 0.3842010498046875, 0.405853271484375, 0.4275054931640625, 0.44915771484375, 0.4708099365234375, 0.492462158203125, 0.5141143798828125, 0.5357666015625, 0.5574188232421875, 0.579071044921875, 0.6007232666015625, 0.62237548828125, 0.6440277099609375, 0.665679931640625, 0.6873321533203125, 0.708984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 8.0, 8.0, 13.0, 18.0, 18.0, 11.0, 25.0, 29.0, 30.0, 28.0, 22.0, 35.0, 39.0, 42.0, 39.0, 38.0, 46.0, 44.0, 49.0, 47.0, 43.0, 46.0, 28.0, 45.0, 29.0, 19.0, 20.0, 24.0, 16.0, 17.0, 25.0, 22.0, 15.0, 13.0, 7.0, 5.0, 4.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51416015625, -0.4976806640625, -0.481201171875, -0.4647216796875, -0.4482421875, -0.4317626953125, -0.415283203125, -0.3988037109375, -0.38232421875, -0.3658447265625, -0.349365234375, -0.3328857421875, -0.31640625, -0.2999267578125, -0.283447265625, -0.2669677734375, -0.25048828125, -0.2340087890625, -0.217529296875, -0.2010498046875, -0.1845703125, -0.1680908203125, -0.151611328125, -0.1351318359375, -0.11865234375, -0.1021728515625, -0.085693359375, -0.0692138671875, -0.052734375, -0.0362548828125, -0.019775390625, -0.0032958984375, 0.01318359375, 0.0296630859375, 0.046142578125, 0.0626220703125, 0.0791015625, 0.0955810546875, 0.112060546875, 0.1285400390625, 0.14501953125, 0.1614990234375, 0.177978515625, 0.1944580078125, 0.2109375, 0.2274169921875, 0.243896484375, 0.2603759765625, 0.27685546875, 0.2933349609375, 0.309814453125, 0.3262939453125, 0.3427734375, 0.3592529296875, 0.375732421875, 0.3922119140625, 0.40869140625, 0.4251708984375, 0.441650390625, 0.4581298828125, 0.474609375, 0.4910888671875, 0.507568359375, 0.5240478515625, 0.54052734375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 9.0, 12.0, 14.0, 18.0, 25.0, 45.0, 99.0, 134.0, 263.0, 589.0, 1429.0, 4651.0, 23640.0, 858208.0, 142165.0, 12266.0, 3032.0, 1004.0, 440.0, 185.0, 108.0, 72.0, 38.0, 29.0, 23.0, 8.0, 14.0, 5.0, 8.0, 2.0, 5.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0003113746643066406, -0.0003029182553291321, -0.00029446184635162354, -0.000286005437374115, -0.00027754902839660645, -0.0002690926194190979, -0.00026063621044158936, -0.0002521798014640808, -0.00024372339248657227, -0.00023526698350906372, -0.00022681057453155518, -0.00021835416555404663, -0.00020989775657653809, -0.00020144134759902954, -0.000192984938621521, -0.00018452852964401245, -0.0001760721206665039, -0.00016761571168899536, -0.00015915930271148682, -0.00015070289373397827, -0.00014224648475646973, -0.00013379007577896118, -0.00012533366680145264, -0.00011687725782394409, -0.00010842084884643555, -9.9964439868927e-05, -9.150803089141846e-05, -8.305162191390991e-05, -7.459521293640137e-05, -6.613880395889282e-05, -5.768239498138428e-05, -4.922598600387573e-05, -4.076957702636719e-05, -3.231316804885864e-05, -2.3856759071350098e-05, -1.5400350093841553e-05, -6.943941116333008e-06, 1.5124678611755371e-06, 9.968876838684082e-06, 1.8425285816192627e-05, 2.6881694793701172e-05, 3.533810377120972e-05, 4.379451274871826e-05, 5.225092172622681e-05, 6.070733070373535e-05, 6.91637396812439e-05, 7.762014865875244e-05, 8.607655763626099e-05, 9.453296661376953e-05, 0.00010298937559127808, 0.00011144578456878662, 0.00011990219354629517, 0.0001283586025238037, 0.00013681501150131226, 0.0001452714204788208, 0.00015372782945632935, 0.0001621842384338379, 0.00017064064741134644, 0.00017909705638885498, 0.00018755346536636353, 0.00019600987434387207, 0.00020446628332138062, 0.00021292269229888916, 0.0002213791012763977, 0.00022983551025390625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 4.0, 9.0, 12.0, 16.0, 25.0, 25.0, 35.0, 29.0, 37.0, 45.0, 52.0, 102.0, 51.0, 52.0, 64.0, 60.0, 54.0, 56.0, 41.0, 37.0, 36.0, 24.0, 28.0, 22.0, 22.0, 13.0, 11.0, 10.0, 5.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9802322387695312e-06, -2.8582289814949036e-06, -2.736225724220276e-06, -2.614222466945648e-06, -2.4922192096710205e-06, -2.370215952396393e-06, -2.248212695121765e-06, -2.1262094378471375e-06, -2.0042061805725098e-06, -1.882202923297882e-06, -1.7601996660232544e-06, -1.6381964087486267e-06, -1.516193151473999e-06, -1.3941898941993713e-06, -1.2721866369247437e-06, -1.150183379650116e-06, -1.0281801223754883e-06, -9.061768651008606e-07, -7.841736078262329e-07, -6.621703505516052e-07, -5.401670932769775e-07, -4.1816383600234985e-07, -2.9616057872772217e-07, -1.7415732145309448e-07, -5.21540641784668e-08, 6.984919309616089e-08, 1.9185245037078857e-07, 3.1385570764541626e-07, 4.3585896492004395e-07, 5.578622221946716e-07, 6.798654794692993e-07, 8.01868736743927e-07, 9.238719940185547e-07, 1.0458752512931824e-06, 1.16787850856781e-06, 1.2898817658424377e-06, 1.4118850231170654e-06, 1.5338882803916931e-06, 1.6558915376663208e-06, 1.7778947949409485e-06, 1.8998980522155762e-06, 2.021901309490204e-06, 2.1439045667648315e-06, 2.2659078240394592e-06, 2.387911081314087e-06, 2.5099143385887146e-06, 2.6319175958633423e-06, 2.75392085313797e-06, 2.8759241104125977e-06, 2.9979273676872253e-06, 3.119930624961853e-06, 3.2419338822364807e-06, 3.3639371395111084e-06, 3.485940396785736e-06, 3.6079436540603638e-06, 3.7299469113349915e-06, 3.851950168609619e-06, 3.973953425884247e-06, 4.0959566831588745e-06, 4.217959940433502e-06, 4.33996319770813e-06, 4.4619664549827576e-06, 4.583969712257385e-06, 4.705972969532013e-06, 4.827976226806641e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 7.0, 6.0, 13.0, 20.0, 10.0, 34.0, 45.0, 70.0, 82.0, 173.0, 319.0, 935.0, 10898.0, 1029226.0, 5264.0, 720.0, 266.0, 157.0, 93.0, 57.0, 45.0, 24.0, 14.0, 18.0, 8.0, 8.0, 5.0, 7.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0005025863647460938, -0.00048708170652389526, -0.0004715770483016968, -0.0004560723900794983, -0.0004405677318572998, -0.0004250630736351013, -0.00040955841541290283, -0.00039405375719070435, -0.00037854909896850586, -0.0003630444407463074, -0.0003475397825241089, -0.0003320351243019104, -0.0003165304660797119, -0.00030102580785751343, -0.00028552114963531494, -0.00027001649141311646, -0.00025451183319091797, -0.00023900717496871948, -0.000223502516746521, -0.0002079978585243225, -0.00019249320030212402, -0.00017698854207992554, -0.00016148388385772705, -0.00014597922563552856, -0.00013047456741333008, -0.00011496990919113159, -9.94652509689331e-05, -8.396059274673462e-05, -6.845593452453613e-05, -5.2951276302337646e-05, -3.744661808013916e-05, -2.1941959857940674e-05, -6.4373016357421875e-06, 9.067356586456299e-06, 2.4572014808654785e-05, 4.007667303085327e-05, 5.558133125305176e-05, 7.108598947525024e-05, 8.659064769744873e-05, 0.00010209530591964722, 0.0001175999641418457, 0.0001331046223640442, 0.00014860928058624268, 0.00016411393880844116, 0.00017961859703063965, 0.00019512325525283813, 0.00021062791347503662, 0.0002261325716972351, 0.0002416372299194336, 0.0002571418881416321, 0.00027264654636383057, 0.00028815120458602905, 0.00030365586280822754, 0.000319160521030426, 0.0003346651792526245, 0.000350169837474823, 0.0003656744956970215, 0.00038117915391921997, 0.00039668381214141846, 0.00041218847036361694, 0.00042769312858581543, 0.0004431977868080139, 0.0004587024450302124, 0.0004742071032524109, 0.0004897117614746094]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 4.0, 14.0, 16.0, 24.0, 30.0, 45.0, 57.0, 94.0, 132.0, 153.0, 128.0, 91.0, 58.0, 37.0, 29.0, 19.0, 16.0, 8.0, 7.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00038361549377441406, -0.00037177279591560364, -0.0003599300980567932, -0.0003480874001979828, -0.00033624470233917236, -0.00032440200448036194, -0.0003125593066215515, -0.0003007166087627411, -0.00028887391090393066, -0.00027703121304512024, -0.0002651885151863098, -0.0002533458173274994, -0.00024150311946868896, -0.00022966042160987854, -0.00021781772375106812, -0.0002059750258922577, -0.00019413232803344727, -0.00018228963017463684, -0.00017044693231582642, -0.000158604234457016, -0.00014676153659820557, -0.00013491883873939514, -0.00012307614088058472, -0.00011123344302177429, -9.939074516296387e-05, -8.754804730415344e-05, -7.570534944534302e-05, -6.386265158653259e-05, -5.201995372772217e-05, -4.017725586891174e-05, -2.833455801010132e-05, -1.6491860151290894e-05, -4.649162292480469e-06, 7.193535566329956e-06, 1.903623342514038e-05, 3.0878931283950806e-05, 4.272162914276123e-05, 5.4564327001571655e-05, 6.640702486038208e-05, 7.82497227191925e-05, 9.009242057800293e-05, 0.00010193511843681335, 0.00011377781629562378, 0.0001256205141544342, 0.00013746321201324463, 0.00014930590987205505, 0.00016114860773086548, 0.0001729913055896759, 0.00018483400344848633, 0.00019667670130729675, 0.00020851939916610718, 0.0002203620970249176, 0.00023220479488372803, 0.00024404749274253845, 0.0002558901906013489, 0.0002677328884601593, 0.0002795755863189697, 0.00029141828417778015, 0.0003032609820365906, 0.000315103679895401, 0.0003269463777542114, 0.00033878907561302185, 0.0003506317734718323, 0.0003624744713306427, 0.0003743171691894531]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 9.0, 24.0, 110.0, 638.0, 182.0, 27.0, 12.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.165371298789978, -1.0953303575515747, -1.025289535522461, -0.9552485942840576, -0.8852076530456543, -0.8151667714118958, -0.7451258897781372, -0.6750849485397339, -0.6050440669059753, -0.5350031852722168, -0.4649622440338135, -0.39492136240005493, -0.324880450963974, -0.25483953952789307, -0.18479865789413452, -0.11475774645805359, -0.044716835021972656, 0.02532406896352768, 0.09536497294902802, 0.16540586948394775, 0.2354467809200287, 0.3054876923561096, 0.37552857398986816, 0.4455694854259491, 0.51561039686203, 0.5856512784957886, 0.6556922197341919, 0.7257331013679504, 0.795773983001709, 0.8658149242401123, 0.9358558058738708, 1.0058966875076294, 1.0759375095367432, 1.1459784507751465, 1.2160192728042603, 1.2860602140426636, 1.356101155281067, 1.4261419773101807, 1.496182918548584, 1.5662238597869873, 1.6362648010253906, 1.706305742263794, 1.7763465642929077, 1.846387505531311, 1.9164284467697144, 1.9864692687988281, 2.0565102100372314, 2.1265511512756348, 2.196591854095459, 2.2666327953338623, 2.3366737365722656, 2.40671443939209, 2.476755380630493, 2.5467963218688965, 2.6168372631073, 2.686878204345703, 2.7569191455841064, 2.8269600868225098, 2.897001028060913, 2.9670419692993164, 3.0370826721191406, 3.107123613357544, 3.1771645545959473, 3.2472054958343506, 3.317246437072754]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 6.0, 4.0, 10.0, 12.0, 20.0, 27.0, 24.0, 25.0, 31.0, 33.0, 46.0, 57.0, 57.0, 62.0, 72.0, 62.0, 56.0, 67.0, 48.0, 48.0, 42.0, 34.0, 30.0, 27.0, 33.0, 21.0, 15.0, 5.0, 9.0, 5.0, 4.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.868140697479248, -3.740694284439087, -3.613247871398926, -3.4858012199401855, -3.3583548069000244, -3.2309083938598633, -3.103461742401123, -2.976015329360962, -2.848568916320801, -2.7211225032806396, -2.5936760902404785, -2.4662294387817383, -2.338783025741577, -2.211336612701416, -2.083889961242676, -1.9564435482025146, -1.8289971351623535, -1.7015507221221924, -1.5741041898727417, -1.446657657623291, -1.3192112445831299, -1.1917648315429688, -1.064318299293518, -0.9368718266487122, -0.8094253540039062, -0.6819788813591003, -0.5545324087142944, -0.4270859360694885, -0.2996394634246826, -0.1721929907798767, -0.0447465181350708, 0.08269995450973511, 0.2101459503173828, 0.3375924229621887, 0.46503889560699463, 0.5924853682518005, 0.7199318408966064, 0.8473783135414124, 0.9748247861862183, 1.102271318435669, 1.22971773147583, 1.3571641445159912, 1.484610676765442, 1.6120572090148926, 1.7395036220550537, 1.8669500350952148, 1.9943965673446655, 2.121843099594116, 2.2492895126342773, 2.3767359256744385, 2.5041823387145996, 2.63162899017334, 2.759075403213501, 2.886521816253662, 3.0139684677124023, 3.1414148807525635, 3.2688612937927246, 3.3963077068328857, 3.523754119873047, 3.651200771331787, 3.7786471843719482, 3.9060935974121094, 4.03354024887085, 4.160986423492432, 4.288433074951172]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 0.0, 5.0, 1.0, 8.0, 13.0, 5.0, 9.0, 19.0, 20.0, 28.0, 28.0, 48.0, 73.0, 379.0, 4818.0, 4177886.0, 9851.0, 703.0, 82.0, 52.0, 49.0, 33.0, 36.0, 22.0, 23.0, 10.0, 13.0, 9.0, 13.0, 10.0, 4.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4921875, -0.47617340087890625, -0.4601593017578125, -0.44414520263671875, -0.428131103515625, -0.41211700439453125, -0.3961029052734375, -0.38008880615234375, -0.36407470703125, -0.34806060791015625, -0.3320465087890625, -0.31603240966796875, -0.300018310546875, -0.28400421142578125, -0.2679901123046875, -0.25197601318359375, -0.2359619140625, -0.21994781494140625, -0.2039337158203125, -0.18791961669921875, -0.171905517578125, -0.15589141845703125, -0.1398773193359375, -0.12386322021484375, -0.10784912109375, -0.09183502197265625, -0.0758209228515625, -0.05980682373046875, -0.043792724609375, -0.02777862548828125, -0.0117645263671875, 0.00424957275390625, 0.020263671875, 0.03627777099609375, 0.0522918701171875, 0.06830596923828125, 0.084320068359375, 0.10033416748046875, 0.1163482666015625, 0.13236236572265625, 0.14837646484375, 0.16439056396484375, 0.1804046630859375, 0.19641876220703125, 0.212432861328125, 0.22844696044921875, 0.2444610595703125, 0.26047515869140625, 0.2764892578125, 0.29250335693359375, 0.3085174560546875, 0.32453155517578125, 0.340545654296875, 0.35655975341796875, 0.3725738525390625, 0.38858795166015625, 0.40460205078125, 0.42061614990234375, 0.4366302490234375, 0.45264434814453125, 0.468658447265625, 0.48467254638671875, 0.5006866455078125, 0.5167007446289062, 0.53271484375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 7.0, 6.0, 2.0, 4.0, 10.0, 6.0, 9.0, 3.0, 12.0, 24.0, 84.0, 226.0, 321.0, 153.0, 32.0, 12.0, 8.0, 5.0, 8.0, 11.0, 4.0, 3.0, 5.0, 5.0, 5.0, 3.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.176025390625, -0.17029571533203125, -0.1645660400390625, -0.15883636474609375, -0.153106689453125, -0.14737701416015625, -0.1416473388671875, -0.13591766357421875, -0.13018798828125, -0.12445831298828125, -0.1187286376953125, -0.11299896240234375, -0.107269287109375, -0.10153961181640625, -0.0958099365234375, -0.09008026123046875, -0.0843505859375, -0.07862091064453125, -0.0728912353515625, -0.06716156005859375, -0.061431884765625, -0.05570220947265625, -0.0499725341796875, -0.04424285888671875, -0.03851318359375, -0.03278350830078125, -0.0270538330078125, -0.02132415771484375, -0.015594482421875, -0.00986480712890625, -0.0041351318359375, 0.00159454345703125, 0.00732421875, 0.01305389404296875, 0.0187835693359375, 0.02451324462890625, 0.030242919921875, 0.03597259521484375, 0.0417022705078125, 0.04743194580078125, 0.05316162109375, 0.05889129638671875, 0.0646209716796875, 0.07035064697265625, 0.076080322265625, 0.08180999755859375, 0.0875396728515625, 0.09326934814453125, 0.0989990234375, 0.10472869873046875, 0.1104583740234375, 0.11618804931640625, 0.121917724609375, 0.12764739990234375, 0.1333770751953125, 0.13910675048828125, 0.14483642578125, 0.15056610107421875, 0.1562957763671875, 0.16202545166015625, 0.167755126953125, 0.17348480224609375, 0.1792144775390625, 0.18494415283203125, 0.190673828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 7.0, 13.0, 11.0, 26.0, 50.0, 163.0, 544.0, 7215.0, 4183122.0, 2342.0, 478.0, 183.0, 61.0, 21.0, 11.0, 13.0, 13.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.66552734375, -0.6477012634277344, -0.6298751831054688, -0.6120491027832031, -0.5942230224609375, -0.5763969421386719, -0.5585708618164062, -0.5407447814941406, -0.522918701171875, -0.5050926208496094, -0.48726654052734375, -0.4694404602050781, -0.4516143798828125, -0.4337882995605469, -0.41596221923828125, -0.3981361389160156, -0.38031005859375, -0.3624839782714844, -0.34465789794921875, -0.3268318176269531, -0.3090057373046875, -0.2911796569824219, -0.27335357666015625, -0.2555274963378906, -0.237701416015625, -0.21987533569335938, -0.20204925537109375, -0.18422317504882812, -0.1663970947265625, -0.14857101440429688, -0.13074493408203125, -0.11291885375976562, -0.0950927734375, -0.07726669311523438, -0.05944061279296875, -0.041614532470703125, -0.0237884521484375, -0.005962371826171875, 0.01186370849609375, 0.029689788818359375, 0.047515869140625, 0.06534194946289062, 0.08316802978515625, 0.10099411010742188, 0.1188201904296875, 0.13664627075195312, 0.15447235107421875, 0.17229843139648438, 0.19012451171875, 0.20795059204101562, 0.22577667236328125, 0.24360275268554688, 0.2614288330078125, 0.2792549133300781, 0.29708099365234375, 0.3149070739746094, 0.332733154296875, 0.3505592346191406, 0.36838531494140625, 0.3862113952636719, 0.4040374755859375, 0.4218635559082031, 0.43968963623046875, 0.4575157165527344, 0.475341796875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 14.0, 38.0, 155.0, 3675.0, 116.0, 35.0, 11.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08447265625, -0.07961654663085938, -0.07476043701171875, -0.06990432739257812, -0.0650482177734375, -0.060192108154296875, -0.05533599853515625, -0.050479888916015625, -0.045623779296875, -0.040767669677734375, -0.03591156005859375, -0.031055450439453125, -0.0261993408203125, -0.021343231201171875, -0.01648712158203125, -0.011631011962890625, -0.00677490234375, -0.001918792724609375, 0.00293731689453125, 0.007793426513671875, 0.0126495361328125, 0.017505645751953125, 0.02236175537109375, 0.027217864990234375, 0.032073974609375, 0.036930084228515625, 0.04178619384765625, 0.046642303466796875, 0.0514984130859375, 0.056354522705078125, 0.06121063232421875, 0.06606674194335938, 0.0709228515625, 0.07577896118164062, 0.08063507080078125, 0.08549118041992188, 0.0903472900390625, 0.09520339965820312, 0.10005950927734375, 0.10491561889648438, 0.109771728515625, 0.11462783813476562, 0.11948394775390625, 0.12434005737304688, 0.1291961669921875, 0.13405227661132812, 0.13890838623046875, 0.14376449584960938, 0.14862060546875, 0.15347671508789062, 0.15833282470703125, 0.16318893432617188, 0.1680450439453125, 0.17290115356445312, 0.17775726318359375, 0.18261337280273438, 0.187469482421875, 0.19232559204101562, 0.19718170166015625, 0.20203781127929688, 0.2068939208984375, 0.21175003051757812, 0.21660614013671875, 0.22146224975585938, 0.226318359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 12.0, 1006.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3770246505737305, -2.300814390182495, -2.224604368209839, -2.1483941078186035, -2.0721840858459473, -1.995973825454712, -1.9197635650634766, -1.8435534238815308, -1.767343282699585, -1.6911331415176392, -1.6149230003356934, -1.538712739944458, -1.4625025987625122, -1.3862924575805664, -1.310082197189331, -1.2338720560073853, -1.1576619148254395, -1.0814517736434937, -1.0052416324615479, -0.9290313720703125, -0.8528212308883667, -0.7766110897064209, -0.7004008889198303, -0.6241906881332397, -0.547980546951294, -0.47177037596702576, -0.39556020498275757, -0.3193500339984894, -0.2431398630142212, -0.166929692029953, -0.09071952104568481, -0.014509320259094238, 0.06170058250427246, 0.13791075348854065, 0.21412092447280884, 0.290331095457077, 0.3665412664413452, 0.4427514374256134, 0.5189616084098816, 0.5951718091964722, 0.671381950378418, 0.7475920915603638, 0.8238022923469543, 0.9000124931335449, 0.9762226343154907, 1.0524327754974365, 1.1286430358886719, 1.2048531770706177, 1.2810633182525635, 1.3572734594345093, 1.433483600616455, 1.5096938610076904, 1.5859040021896362, 1.662114143371582, 1.7383244037628174, 1.8145345449447632, 1.890744686126709, 1.9669548273086548, 2.0431649684906006, 2.119375228881836, 2.195585250854492, 2.2717955112457275, 2.348005771636963, 2.424215793609619, 2.5004260540008545]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 9.0, 24.0, 42.0, 62.0, 78.0, 111.0, 104.0, 113.0, 117.0, 88.0, 72.0, 80.0, 50.0, 18.0, 11.0, 13.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3936622738838196, -0.38071200251579285, -0.3677617311477661, -0.354811429977417, -0.34186115860939026, -0.3289108872413635, -0.3159606158733368, -0.30301034450531006, -0.29006004333496094, -0.2771097719669342, -0.26415950059890747, -0.25120919942855835, -0.23825892806053162, -0.22530865669250488, -0.21235838532447815, -0.19940811395645142, -0.18645784258842468, -0.17350757122039795, -0.16055728495121002, -0.1476070135831833, -0.13465672731399536, -0.12170645594596863, -0.1087561845779419, -0.09580590575933456, -0.08285562694072723, -0.0699053481221199, -0.05695507302880287, -0.04400479793548584, -0.03105451911687851, -0.01810424029827118, -0.005153968930244446, 0.0077963098883628845, 0.020746588706970215, 0.033696867525577545, 0.04664714261889458, 0.05959741771221161, 0.07254769653081894, 0.08549797534942627, 0.098448246717453, 0.11139852553606033, 0.12434880435466766, 0.1372990757226944, 0.15024936199188232, 0.16319963335990906, 0.1761499047279358, 0.18910019099712372, 0.20205046236515045, 0.21500074863433838, 0.2279510200023651, 0.24090129137039185, 0.2538515627384186, 0.2668018341064453, 0.27975213527679443, 0.29270240664482117, 0.3056526780128479, 0.31860294938087463, 0.33155322074890137, 0.3445034921169281, 0.35745376348495483, 0.37040406465530396, 0.3833543360233307, 0.3963046073913574, 0.40925487875938416, 0.4222051501274109, 0.43515545129776]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 8.0, 8.0, 9.0, 11.0, 20.0, 31.0, 21.0, 29.0, 38.0, 47.0, 51.0, 63.0, 75.0, 100.0, 133.0, 217.0, 303.0, 462.0, 789.0, 1343.0, 2308.0, 3859.0, 7755.0, 17692.0, 125794.0, 839161.0, 26376.0, 10026.0, 4767.0, 2571.0, 1626.0, 977.0, 614.0, 380.0, 223.0, 156.0, 122.0, 78.0, 68.0, 44.0, 30.0, 27.0, 25.0, 24.0, 18.0, 18.0, 12.0, 11.0, 6.0, 6.0, 4.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2327880859375, -0.22532081604003906, -0.21785354614257812, -0.2103862762451172, -0.20291900634765625, -0.1954517364501953, -0.18798446655273438, -0.18051719665527344, -0.1730499267578125, -0.16558265686035156, -0.15811538696289062, -0.1506481170654297, -0.14318084716796875, -0.1357135772705078, -0.12824630737304688, -0.12077903747558594, -0.113311767578125, -0.10584449768066406, -0.09837722778320312, -0.09090995788574219, -0.08344268798828125, -0.07597541809082031, -0.06850814819335938, -0.06104087829589844, -0.0535736083984375, -0.04610633850097656, -0.038639068603515625, -0.031171798706054688, -0.02370452880859375, -0.016237258911132812, -0.008769989013671875, -0.0013027191162109375, 0.00616455078125, 0.013631820678710938, 0.021099090576171875, 0.028566360473632812, 0.03603363037109375, 0.04350090026855469, 0.050968170166015625, 0.05843544006347656, 0.0659027099609375, 0.07336997985839844, 0.08083724975585938, 0.08830451965332031, 0.09577178955078125, 0.10323905944824219, 0.11070632934570312, 0.11817359924316406, 0.125640869140625, 0.13310813903808594, 0.14057540893554688, 0.1480426788330078, 0.15550994873046875, 0.1629772186279297, 0.17044448852539062, 0.17791175842285156, 0.1853790283203125, 0.19284629821777344, 0.20031356811523438, 0.2077808380126953, 0.21524810791015625, 0.2227153778076172, 0.23018264770507812, 0.23764991760253906, 0.2451171875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 7.0, 6.0, 2.0, 4.0, 10.0, 6.0, 9.0, 3.0, 12.0, 24.0, 87.0, 223.0, 324.0, 150.0, 31.0, 13.0, 8.0, 5.0, 8.0, 11.0, 4.0, 3.0, 5.0, 5.0, 5.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.17578125, -0.1700572967529297, -0.16433334350585938, -0.15860939025878906, -0.15288543701171875, -0.14716148376464844, -0.14143753051757812, -0.1357135772705078, -0.1299896240234375, -0.12426567077636719, -0.11854171752929688, -0.11281776428222656, -0.10709381103515625, -0.10136985778808594, -0.09564590454101562, -0.08992195129394531, -0.084197998046875, -0.07847404479980469, -0.07275009155273438, -0.06702613830566406, -0.06130218505859375, -0.05557823181152344, -0.049854278564453125, -0.04413032531738281, -0.0384063720703125, -0.03268241882324219, -0.026958465576171875, -0.021234512329101562, -0.01551055908203125, -0.009786605834960938, -0.004062652587890625, 0.0016613006591796875, 0.00738525390625, 0.013109207153320312, 0.018833160400390625, 0.024557113647460938, 0.03028106689453125, 0.03600502014160156, 0.041728973388671875, 0.04745292663574219, 0.0531768798828125, 0.05890083312988281, 0.06462478637695312, 0.07034873962402344, 0.07607269287109375, 0.08179664611816406, 0.08752059936523438, 0.09324455261230469, 0.098968505859375, 0.10469245910644531, 0.11041641235351562, 0.11614036560058594, 0.12186431884765625, 0.12758827209472656, 0.13331222534179688, 0.1390361785888672, 0.1447601318359375, 0.1504840850830078, 0.15620803833007812, 0.16193199157714844, 0.16765594482421875, 0.17337989807128906, 0.17910385131835938, 0.1848278045654297, 0.1905517578125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 6.0, 2.0, 11.0, 17.0, 10.0, 28.0, 26.0, 32.0, 41.0, 59.0, 83.0, 103.0, 125.0, 195.0, 272.0, 442.0, 872.0, 2727.0, 802102.0, 236948.0, 2237.0, 833.0, 444.0, 222.0, 169.0, 119.0, 94.0, 90.0, 66.0, 42.0, 33.0, 25.0, 22.0, 20.0, 12.0, 6.0, 11.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8564453125, -0.8296356201171875, -0.802825927734375, -0.7760162353515625, -0.74920654296875, -0.7223968505859375, -0.695587158203125, -0.6687774658203125, -0.6419677734375, -0.6151580810546875, -0.588348388671875, -0.5615386962890625, -0.53472900390625, -0.5079193115234375, -0.481109619140625, -0.4542999267578125, -0.427490234375, -0.4006805419921875, -0.373870849609375, -0.3470611572265625, -0.32025146484375, -0.2934417724609375, -0.266632080078125, -0.2398223876953125, -0.2130126953125, -0.1862030029296875, -0.159393310546875, -0.1325836181640625, -0.10577392578125, -0.0789642333984375, -0.052154541015625, -0.0253448486328125, 0.00146484375, 0.0282745361328125, 0.055084228515625, 0.0818939208984375, 0.10870361328125, 0.1355133056640625, 0.162322998046875, 0.1891326904296875, 0.2159423828125, 0.2427520751953125, 0.269561767578125, 0.2963714599609375, 0.32318115234375, 0.3499908447265625, 0.376800537109375, 0.4036102294921875, 0.430419921875, 0.4572296142578125, 0.484039306640625, 0.5108489990234375, 0.53765869140625, 0.5644683837890625, 0.591278076171875, 0.6180877685546875, 0.6448974609375, 0.6717071533203125, 0.698516845703125, 0.7253265380859375, 0.75213623046875, 0.7789459228515625, 0.805755615234375, 0.8325653076171875, 0.859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 1.0, 8.0, 11.0, 5.0, 15.0, 13.0, 14.0, 22.0, 26.0, 29.0, 30.0, 35.0, 44.0, 46.0, 44.0, 52.0, 61.0, 46.0, 54.0, 50.0, 51.0, 51.0, 34.0, 45.0, 40.0, 33.0, 38.0, 25.0, 19.0, 13.0, 9.0, 12.0, 8.0, 10.0, 0.0, 7.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6318359375, -0.612060546875, -0.59228515625, -0.572509765625, -0.552734375, -0.532958984375, -0.51318359375, -0.493408203125, -0.4736328125, -0.453857421875, -0.43408203125, -0.414306640625, -0.39453125, -0.374755859375, -0.35498046875, -0.335205078125, -0.3154296875, -0.295654296875, -0.27587890625, -0.256103515625, -0.236328125, -0.216552734375, -0.19677734375, -0.177001953125, -0.1572265625, -0.137451171875, -0.11767578125, -0.097900390625, -0.078125, -0.058349609375, -0.03857421875, -0.018798828125, 0.0009765625, 0.020751953125, 0.04052734375, 0.060302734375, 0.080078125, 0.099853515625, 0.11962890625, 0.139404296875, 0.1591796875, 0.178955078125, 0.19873046875, 0.218505859375, 0.23828125, 0.258056640625, 0.27783203125, 0.297607421875, 0.3173828125, 0.337158203125, 0.35693359375, 0.376708984375, 0.396484375, 0.416259765625, 0.43603515625, 0.455810546875, 0.4755859375, 0.495361328125, 0.51513671875, 0.534912109375, 0.5546875, 0.574462890625, 0.59423828125, 0.614013671875, 0.6337890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 7.0, 19.0, 15.0, 27.0, 33.0, 48.0, 60.0, 108.0, 166.0, 215.0, 402.0, 716.0, 1508.0, 3371.0, 8941.0, 30851.0, 201088.0, 716653.0, 60412.0, 14514.0, 4920.0, 2065.0, 984.0, 520.0, 306.0, 206.0, 126.0, 74.0, 51.0, 39.0, 17.0, 16.0, 11.0, 18.0, 9.0, 7.0, 4.0, 2.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0001608133316040039, -0.00015566125512123108, -0.00015050917863845825, -0.00014535710215568542, -0.0001402050256729126, -0.00013505294919013977, -0.00012990087270736694, -0.00012474879622459412, -0.00011959671974182129, -0.00011444464325904846, -0.00010929256677627563, -0.00010414049029350281, -9.898841381072998e-05, -9.383633732795715e-05, -8.868426084518433e-05, -8.35321843624115e-05, -7.838010787963867e-05, -7.322803139686584e-05, -6.807595491409302e-05, -6.292387843132019e-05, -5.777180194854736e-05, -5.2619725465774536e-05, -4.746764898300171e-05, -4.231557250022888e-05, -3.7163496017456055e-05, -3.201141953468323e-05, -2.68593430519104e-05, -2.1707266569137573e-05, -1.6555190086364746e-05, -1.1403113603591919e-05, -6.251037120819092e-06, -1.0989606380462646e-06, 4.0531158447265625e-06, 9.20519232749939e-06, 1.4357268810272217e-05, 1.9509345293045044e-05, 2.466142177581787e-05, 2.9813498258590698e-05, 3.4965574741363525e-05, 4.011765122413635e-05, 4.526972770690918e-05, 5.042180418968201e-05, 5.5573880672454834e-05, 6.072595715522766e-05, 6.587803363800049e-05, 7.103011012077332e-05, 7.618218660354614e-05, 8.133426308631897e-05, 8.64863395690918e-05, 9.163841605186462e-05, 9.679049253463745e-05, 0.00010194256901741028, 0.0001070946455001831, 0.00011224672198295593, 0.00011739879846572876, 0.0001225508749485016, 0.00012770295143127441, 0.00013285502791404724, 0.00013800710439682007, 0.0001431591808795929, 0.00014831125736236572, 0.00015346333384513855, 0.00015861541032791138, 0.0001637674868106842, 0.00016891956329345703]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 7.0, 11.0, 8.0, 20.0, 12.0, 31.0, 37.0, 45.0, 43.0, 97.0, 50.0, 92.0, 91.0, 89.0, 71.0, 71.0, 34.0, 60.0, 41.0, 25.0, 17.0, 12.0, 9.0, 4.0, 2.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.649162292480469e-06, -4.479661583900452e-06, -4.3101608753204346e-06, -4.1406601667404175e-06, -3.9711594581604e-06, -3.8016587495803833e-06, -3.632158041000366e-06, -3.462657332420349e-06, -3.293156623840332e-06, -3.123655915260315e-06, -2.954155206680298e-06, -2.7846544981002808e-06, -2.6151537895202637e-06, -2.4456530809402466e-06, -2.2761523723602295e-06, -2.1066516637802124e-06, -1.9371509552001953e-06, -1.7676502466201782e-06, -1.5981495380401611e-06, -1.428648829460144e-06, -1.259148120880127e-06, -1.0896474123001099e-06, -9.201467037200928e-07, -7.506459951400757e-07, -5.811452865600586e-07, -4.116445779800415e-07, -2.421438694000244e-07, -7.264316082000732e-08, 9.685754776000977e-08, 2.6635825634002686e-07, 4.3585896492004395e-07, 6.05359673500061e-07, 7.748603820800781e-07, 9.443610906600952e-07, 1.1138617992401123e-06, 1.2833625078201294e-06, 1.4528632164001465e-06, 1.6223639249801636e-06, 1.7918646335601807e-06, 1.9613653421401978e-06, 2.130866050720215e-06, 2.300366759300232e-06, 2.469867467880249e-06, 2.639368176460266e-06, 2.808868885040283e-06, 2.9783695936203003e-06, 3.1478703022003174e-06, 3.3173710107803345e-06, 3.4868717193603516e-06, 3.6563724279403687e-06, 3.825873136520386e-06, 3.995373845100403e-06, 4.16487455368042e-06, 4.334375262260437e-06, 4.503875970840454e-06, 4.673376679420471e-06, 4.842877388000488e-06, 5.012378096580505e-06, 5.1818788051605225e-06, 5.3513795137405396e-06, 5.520880222320557e-06, 5.690380930900574e-06, 5.859881639480591e-06, 6.029382348060608e-06, 6.198883056640625e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 7.0, 4.0, 10.0, 16.0, 13.0, 14.0, 51.0, 41.0, 60.0, 90.0, 145.0, 268.0, 593.0, 2259.0, 1024472.0, 18545.0, 1033.0, 361.0, 178.0, 119.0, 83.0, 53.0, 49.0, 27.0, 20.0, 14.0, 7.0, 11.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006399154663085938, -0.0006209537386894226, -0.0006019920110702515, -0.0005830302834510803, -0.0005640685558319092, -0.000545106828212738, -0.0005261451005935669, -0.0005071833729743958, -0.0004882216453552246, -0.00046925991773605347, -0.0004502981901168823, -0.0004313364624977112, -0.00041237473487854004, -0.0003934130072593689, -0.00037445127964019775, -0.0003554895520210266, -0.00033652782440185547, -0.0003175660967826843, -0.0002986043691635132, -0.00027964264154434204, -0.0002606809139251709, -0.00024171918630599976, -0.0002227574586868286, -0.00020379573106765747, -0.00018483400344848633, -0.00016587227582931519, -0.00014691054821014404, -0.0001279488205909729, -0.00010898709297180176, -9.002536535263062e-05, -7.106363773345947e-05, -5.210191011428833e-05, -3.314018249511719e-05, -1.4178454875946045e-05, 4.783272743225098e-06, 2.374500036239624e-05, 4.270672798156738e-05, 6.166845560073853e-05, 8.063018321990967e-05, 9.959191083908081e-05, 0.00011855363845825195, 0.0001375153660774231, 0.00015647709369659424, 0.00017543882131576538, 0.00019440054893493652, 0.00021336227655410767, 0.0002323240041732788, 0.00025128573179244995, 0.0002702474594116211, 0.00028920918703079224, 0.0003081709146499634, 0.0003271326422691345, 0.00034609436988830566, 0.0003650560975074768, 0.00038401782512664795, 0.0004029795527458191, 0.00042194128036499023, 0.0004409030079841614, 0.0004598647356033325, 0.00047882646322250366, 0.0004977881908416748, 0.000516749918460846, 0.0005357116460800171, 0.0005546733736991882, 0.0005736351013183594]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 7.0, 8.0, 5.0, 8.0, 20.0, 20.0, 21.0, 20.0, 22.0, 39.0, 50.0, 76.0, 101.0, 125.0, 131.0, 103.0, 66.0, 38.0, 35.0, 31.0, 20.0, 13.0, 11.0, 12.0, 4.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004725456237792969, -0.0004596598446369171, -0.00044677406549453735, -0.0004338882863521576, -0.00042100250720977783, -0.00040811672806739807, -0.0003952309489250183, -0.00038234516978263855, -0.0003694593906402588, -0.00035657361149787903, -0.00034368783235549927, -0.0003308020532131195, -0.00031791627407073975, -0.00030503049492836, -0.0002921447157859802, -0.00027925893664360046, -0.0002663731575012207, -0.00025348737835884094, -0.00024060159921646118, -0.00022771582007408142, -0.00021483004093170166, -0.0002019442617893219, -0.00018905848264694214, -0.00017617270350456238, -0.00016328692436218262, -0.00015040114521980286, -0.0001375153660774231, -0.00012462958693504333, -0.00011174380779266357, -9.885802865028381e-05, -8.597224950790405e-05, -7.308647036552429e-05, -6.020069122314453e-05, -4.731491208076477e-05, -3.442913293838501e-05, -2.154335379600525e-05, -8.657574653625488e-06, 4.2282044887542725e-06, 1.7113983631134033e-05, 2.9999762773513794e-05, 4.2885541915893555e-05, 5.5771321058273315e-05, 6.865710020065308e-05, 8.154287934303284e-05, 9.44286584854126e-05, 0.00010731443762779236, 0.00012020021677017212, 0.00013308599591255188, 0.00014597177505493164, 0.0001588575541973114, 0.00017174333333969116, 0.00018462911248207092, 0.00019751489162445068, 0.00021040067076683044, 0.0002232864499092102, 0.00023617222905158997, 0.0002490580081939697, 0.0002619437873363495, 0.00027482956647872925, 0.000287715345621109, 0.00030060112476348877, 0.00031348690390586853, 0.0003263726830482483, 0.00033925846219062805, 0.0003521442413330078]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1000.0, 11.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.616189002990723, -4.132904052734375, -3.649618625640869, -3.1663336753845215, -2.6830484867095947, -2.199763298034668, -1.7164783477783203, -1.2331931591033936, -0.7499079704284668, -0.2666228413581848, 0.21666228771209717, 0.6999473571777344, 1.1832325458526611, 1.666517734527588, 2.1498026847839355, 2.6330878734588623, 3.116373062133789, 3.599658250808716, 4.082943439483643, 4.56622838973999, 5.049513816833496, 5.532798767089844, 6.016083717346191, 6.499368667602539, 6.982654094696045, 7.465939044952393, 7.949224472045898, 8.432509422302246, 8.915794372558594, 9.399080276489258, 9.882364273071289, 10.365650177001953, 10.848936080932617, 11.332221031188965, 11.815505981445312, 12.298791885375977, 12.782076835632324, 13.265361785888672, 13.74864673614502, 14.231931686401367, 14.715217590332031, 15.198502540588379, 15.681787490844727, 16.16507339477539, 16.648357391357422, 17.131643295288086, 17.61492919921875, 18.09821319580078, 18.581497192382812, 19.064783096313477, 19.548067092895508, 20.031352996826172, 20.514636993408203, 20.997922897338867, 21.48120880126953, 21.964492797851562, 22.447778701782227, 22.93106460571289, 23.414348602294922, 23.897634506225586, 24.380918502807617, 24.86420440673828, 25.347488403320312, 25.830774307250977, 26.31406021118164]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 7.0, 3.0, 10.0, 5.0, 12.0, 13.0, 13.0, 5.0, 26.0, 21.0, 17.0, 33.0, 33.0, 44.0, 32.0, 39.0, 46.0, 46.0, 42.0, 51.0, 57.0, 44.0, 54.0, 49.0, 39.0, 47.0, 27.0, 24.0, 37.0, 28.0, 20.0, 17.0, 13.0, 6.0, 20.0, 9.0, 4.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1013424396514893, -2.995605707168579, -2.889868974685669, -2.7841320037841797, -2.6783952713012695, -2.5726585388183594, -2.466921806335449, -2.361185073852539, -2.255448341369629, -2.1497116088867188, -2.0439748764038086, -1.9382380247116089, -1.8325011730194092, -1.726764440536499, -1.6210277080535889, -1.5152909755706787, -1.4095540046691895, -1.3038172721862793, -1.1980804204940796, -1.0923436880111694, -0.9866068959236145, -0.8808701038360596, -0.7751333713531494, -0.6693965792655945, -0.5636597871780396, -0.4579229950904846, -0.3521862328052521, -0.24644947052001953, -0.1407126784324646, -0.03497588634490967, 0.07076084613800049, 0.17649763822555542, 0.28223419189453125, 0.3879709839820862, 0.4937077462673187, 0.5994445085525513, 0.7051813006401062, 0.8109180927276611, 0.9166548252105713, 1.0223915576934814, 1.1281284093856812, 1.2338651418685913, 1.339601993560791, 1.4453387260437012, 1.5510754585266113, 1.656812310218811, 1.7625490427017212, 1.868285894393921, 1.974022626876831, 2.079759359359741, 2.1854960918426514, 2.2912330627441406, 2.396969795227051, 2.502706527709961, 2.608443260192871, 2.7141799926757812, 2.8199167251586914, 2.9256534576416016, 3.0313901901245117, 3.137126922607422, 3.242863893508911, 3.3486006259918213, 3.4543373584747314, 3.5600740909576416, 3.665811061859131]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 6.0, 6.0, 9.0, 12.0, 5.0, 15.0, 15.0, 26.0, 44.0, 124.0, 1396.0, 4187616.0, 4704.0, 89.0, 52.0, 18.0, 16.0, 19.0, 12.0, 10.0, 11.0, 13.0, 6.0, 8.0, 5.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.978515625, -0.9466400146484375, -0.914764404296875, -0.8828887939453125, -0.85101318359375, -0.8191375732421875, -0.787261962890625, -0.7553863525390625, -0.7235107421875, -0.6916351318359375, -0.659759521484375, -0.6278839111328125, -0.59600830078125, -0.5641326904296875, -0.532257080078125, -0.5003814697265625, -0.468505859375, -0.4366302490234375, -0.404754638671875, -0.3728790283203125, -0.34100341796875, -0.3091278076171875, -0.277252197265625, -0.2453765869140625, -0.2135009765625, -0.1816253662109375, -0.149749755859375, -0.1178741455078125, -0.08599853515625, -0.0541229248046875, -0.022247314453125, 0.0096282958984375, 0.04150390625, 0.0733795166015625, 0.105255126953125, 0.1371307373046875, 0.16900634765625, 0.2008819580078125, 0.232757568359375, 0.2646331787109375, 0.2965087890625, 0.3283843994140625, 0.360260009765625, 0.3921356201171875, 0.42401123046875, 0.4558868408203125, 0.487762451171875, 0.5196380615234375, 0.551513671875, 0.5833892822265625, 0.615264892578125, 0.6471405029296875, 0.67901611328125, 0.7108917236328125, 0.742767333984375, 0.7746429443359375, 0.8065185546875, 0.8383941650390625, 0.870269775390625, 0.9021453857421875, 0.93402099609375, 0.9658966064453125, 0.997772216796875, 1.0296478271484375, 1.0615234375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 7.0, 4.0, 4.0, 6.0, 9.0, 4.0, 10.0, 6.0, 11.0, 23.0, 100.0, 219.0, 316.0, 147.0, 33.0, 13.0, 6.0, 5.0, 9.0, 9.0, 5.0, 6.0, 4.0, 5.0, 5.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1732177734375, -0.1675701141357422, -0.16192245483398438, -0.15627479553222656, -0.15062713623046875, -0.14497947692871094, -0.13933181762695312, -0.1336841583251953, -0.1280364990234375, -0.12238883972167969, -0.11674118041992188, -0.11109352111816406, -0.10544586181640625, -0.09979820251464844, -0.09415054321289062, -0.08850288391113281, -0.082855224609375, -0.07720756530761719, -0.07155990600585938, -0.06591224670410156, -0.06026458740234375, -0.05461692810058594, -0.048969268798828125, -0.04332160949707031, -0.0376739501953125, -0.03202629089355469, -0.026378631591796875, -0.020730972290039062, -0.01508331298828125, -0.009435653686523438, -0.003787994384765625, 0.0018596649169921875, 0.00750732421875, 0.013154983520507812, 0.018802642822265625, 0.024450302124023438, 0.03009796142578125, 0.03574562072753906, 0.041393280029296875, 0.04704093933105469, 0.0526885986328125, 0.05833625793457031, 0.06398391723632812, 0.06963157653808594, 0.07527923583984375, 0.08092689514160156, 0.08657455444335938, 0.09222221374511719, 0.097869873046875, 0.10351753234863281, 0.10916519165039062, 0.11481285095214844, 0.12046051025390625, 0.12610816955566406, 0.13175582885742188, 0.1374034881591797, 0.1430511474609375, 0.1486988067626953, 0.15434646606445312, 0.15999412536621094, 0.16564178466796875, 0.17128944396972656, 0.17693710327148438, 0.1825847625732422, 0.188232421875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 3.0, 6.0, 2.0, 8.0, 17.0, 23.0, 29.0, 97.0, 174.0, 632.0, 2682.0, 72399.0, 4111608.0, 5088.0, 1001.0, 286.0, 107.0, 40.0, 23.0, 25.0, 5.0, 3.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2237548828125, -0.21633338928222656, -0.20891189575195312, -0.2014904022216797, -0.19406890869140625, -0.1866474151611328, -0.17922592163085938, -0.17180442810058594, -0.1643829345703125, -0.15696144104003906, -0.14953994750976562, -0.1421184539794922, -0.13469696044921875, -0.1272754669189453, -0.11985397338867188, -0.11243247985839844, -0.105010986328125, -0.09758949279785156, -0.09016799926757812, -0.08274650573730469, -0.07532501220703125, -0.06790351867675781, -0.060482025146484375, -0.05306053161621094, -0.0456390380859375, -0.03821754455566406, -0.030796051025390625, -0.023374557495117188, -0.01595306396484375, -0.008531570434570312, -0.001110076904296875, 0.0063114166259765625, 0.01373291015625, 0.021154403686523438, 0.028575897216796875, 0.03599739074707031, 0.04341888427734375, 0.05084037780761719, 0.058261871337890625, 0.06568336486816406, 0.0731048583984375, 0.08052635192871094, 0.08794784545898438, 0.09536933898925781, 0.10279083251953125, 0.11021232604980469, 0.11763381958007812, 0.12505531311035156, 0.132476806640625, 0.13989830017089844, 0.14731979370117188, 0.1547412872314453, 0.16216278076171875, 0.1695842742919922, 0.17700576782226562, 0.18442726135253906, 0.1918487548828125, 0.19927024841308594, 0.20669174194335938, 0.2141132354736328, 0.22153472900390625, 0.2289562225341797, 0.23637771606445312, 0.24379920959472656, 0.251220703125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 12.0, 30.0, 54.0, 148.0, 3241.0, 395.0, 81.0, 38.0, 24.0, 15.0, 5.0, 3.0, 9.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10882568359375, -0.10560321807861328, -0.10238075256347656, -0.09915828704833984, -0.09593582153320312, -0.0927133560180664, -0.08949089050292969, -0.08626842498779297, -0.08304595947265625, -0.07982349395751953, -0.07660102844238281, -0.0733785629272461, -0.07015609741210938, -0.06693363189697266, -0.06371116638183594, -0.06048870086669922, -0.0572662353515625, -0.05404376983642578, -0.05082130432128906, -0.047598838806152344, -0.044376373291015625, -0.041153907775878906, -0.03793144226074219, -0.03470897674560547, -0.03148651123046875, -0.02826404571533203, -0.025041580200195312, -0.021819114685058594, -0.018596649169921875, -0.015374183654785156, -0.012151718139648438, -0.008929252624511719, -0.005706787109375, -0.0024843215942382812, 0.0007381439208984375, 0.003960609436035156, 0.007183074951171875, 0.010405540466308594, 0.013628005981445312, 0.01685047149658203, 0.02007293701171875, 0.02329540252685547, 0.026517868041992188, 0.029740333557128906, 0.032962799072265625, 0.036185264587402344, 0.03940773010253906, 0.04263019561767578, 0.0458526611328125, 0.04907512664794922, 0.05229759216308594, 0.055520057678222656, 0.058742523193359375, 0.061964988708496094, 0.06518745422363281, 0.06840991973876953, 0.07163238525390625, 0.07485485076904297, 0.07807731628417969, 0.0812997817993164, 0.08452224731445312, 0.08774471282958984, 0.09096717834472656, 0.09418964385986328, 0.097412109375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1001.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.955221176147461, -2.8908016681671143, -2.8263821601867676, -2.761962652206421, -2.697543144226074, -2.6331236362457275, -2.568704128265381, -2.504284620285034, -2.4398651123046875, -2.375445604324341, -2.311026096343994, -2.2466065883636475, -2.182187080383301, -2.117767572402954, -2.0533480644226074, -1.9889285564422607, -1.9245091676712036, -1.860089659690857, -1.7956701517105103, -1.7312506437301636, -1.666831135749817, -1.6024116277694702, -1.537992238998413, -1.4735727310180664, -1.4091532230377197, -1.344733715057373, -1.2803142070770264, -1.2158946990966797, -1.151475191116333, -1.0870556831359863, -1.0226361751556396, -0.9582167267799377, -0.8937971591949463, -0.8293776512145996, -0.7649581432342529, -0.7005386352539062, -0.6361191272735596, -0.5716996192932129, -0.507280170917511, -0.4428606629371643, -0.3784411549568176, -0.31402164697647095, -0.24960215389728546, -0.18518266081809998, -0.1207631528377533, -0.056343644857406616, 0.008075833320617676, 0.07249534130096436, 0.13691484928131104, 0.20133435726165771, 0.2657538652420044, 0.3301733434200287, 0.39459285140037537, 0.45901235938072205, 0.5234318375587463, 0.587851345539093, 0.6522708535194397, 0.7166903614997864, 0.7811098694801331, 0.845529317855835, 0.9099488258361816, 0.9743683338165283, 1.038787841796875, 1.1032073497772217, 1.1676268577575684]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 5.0, 9.0, 7.0, 10.0, 16.0, 15.0, 20.0, 26.0, 28.0, 26.0, 34.0, 42.0, 47.0, 50.0, 39.0, 42.0, 62.0, 46.0, 38.0, 47.0, 47.0, 43.0, 40.0, 40.0, 31.0, 46.0, 32.0, 15.0, 19.0, 16.0, 17.0, 11.0, 7.0, 4.0, 10.0, 8.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15918004512786865, -0.15401114523410797, -0.1488422453403473, -0.1436733603477478, -0.13850446045398712, -0.13333556056022644, -0.12816667556762695, -0.12299777567386627, -0.11782887578010559, -0.11265997588634491, -0.10749108344316483, -0.10232219099998474, -0.09715329110622406, -0.09198439121246338, -0.0868154987692833, -0.08164660632610321, -0.07647770643234253, -0.07130880653858185, -0.06613991409540176, -0.06097101792693138, -0.055802121758461, -0.050633225589990616, -0.04546432942152023, -0.04029543325304985, -0.03512653708457947, -0.029957640916109085, -0.024788744747638702, -0.01961984857916832, -0.014450952410697937, -0.009282056242227554, -0.004113160073757172, 0.001055736094713211, 0.006224632263183594, 0.011393528431653976, 0.01656242460012436, 0.021731320768594742, 0.026900216937065125, 0.03206911310553551, 0.03723800927400589, 0.04240690544247627, 0.047575801610946655, 0.05274469777941704, 0.05791359394788742, 0.0630824863910675, 0.06825138628482819, 0.07342028617858887, 0.07858917862176895, 0.08375807106494904, 0.08892697095870972, 0.0940958708524704, 0.09926476329565048, 0.10443365573883057, 0.10960255563259125, 0.11477145552635193, 0.11994034796953201, 0.1251092404127121, 0.13027814030647278, 0.13544704020023346, 0.14061594009399414, 0.14578482508659363, 0.1509537249803543, 0.156122624874115, 0.16129150986671448, 0.16646040976047516, 0.17162930965423584]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 7.0, 12.0, 14.0, 19.0, 13.0, 20.0, 25.0, 41.0, 53.0, 75.0, 109.0, 147.0, 255.0, 351.0, 557.0, 824.0, 1387.0, 2388.0, 4585.0, 10122.0, 31360.0, 903407.0, 65848.0, 13553.0, 5636.0, 3034.0, 1652.0, 983.0, 686.0, 449.0, 292.0, 181.0, 108.0, 83.0, 55.0, 44.0, 34.0, 26.0, 25.0, 18.0, 19.0, 13.0, 8.0, 8.0, 10.0, 5.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.17431640625, -0.16863250732421875, -0.1629486083984375, -0.15726470947265625, -0.151580810546875, -0.14589691162109375, -0.1402130126953125, -0.13452911376953125, -0.12884521484375, -0.12316131591796875, -0.1174774169921875, -0.11179351806640625, -0.106109619140625, -0.10042572021484375, -0.0947418212890625, -0.08905792236328125, -0.0833740234375, -0.07769012451171875, -0.0720062255859375, -0.06632232666015625, -0.060638427734375, -0.05495452880859375, -0.0492706298828125, -0.04358673095703125, -0.03790283203125, -0.03221893310546875, -0.0265350341796875, -0.02085113525390625, -0.015167236328125, -0.00948333740234375, -0.0037994384765625, 0.00188446044921875, 0.007568359375, 0.01325225830078125, 0.0189361572265625, 0.02462005615234375, 0.030303955078125, 0.03598785400390625, 0.0416717529296875, 0.04735565185546875, 0.05303955078125, 0.05872344970703125, 0.0644073486328125, 0.07009124755859375, 0.075775146484375, 0.08145904541015625, 0.0871429443359375, 0.09282684326171875, 0.0985107421875, 0.10419464111328125, 0.1098785400390625, 0.11556243896484375, 0.121246337890625, 0.12693023681640625, 0.1326141357421875, 0.13829803466796875, 0.14398193359375, 0.14966583251953125, 0.1553497314453125, 0.16103363037109375, 0.166717529296875, 0.17240142822265625, 0.1780853271484375, 0.18376922607421875, 0.189453125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 4.0, 5.0, 6.0, 9.0, 4.0, 10.0, 6.0, 11.0, 23.0, 101.0, 225.0, 314.0, 142.0, 34.0, 12.0, 6.0, 5.0, 9.0, 9.0, 6.0, 5.0, 4.0, 5.0, 5.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1732177734375, -0.16756820678710938, -0.16191864013671875, -0.15626907348632812, -0.1506195068359375, -0.14496994018554688, -0.13932037353515625, -0.13367080688476562, -0.128021240234375, -0.12237167358398438, -0.11672210693359375, -0.11107254028320312, -0.1054229736328125, -0.09977340698242188, -0.09412384033203125, -0.08847427368164062, -0.08282470703125, -0.07717514038085938, -0.07152557373046875, -0.06587600708007812, -0.0602264404296875, -0.054576873779296875, -0.04892730712890625, -0.043277740478515625, -0.037628173828125, -0.031978607177734375, -0.02632904052734375, -0.020679473876953125, -0.0150299072265625, -0.009380340576171875, -0.00373077392578125, 0.001918792724609375, 0.007568359375, 0.013217926025390625, 0.01886749267578125, 0.024517059326171875, 0.0301666259765625, 0.035816192626953125, 0.04146575927734375, 0.047115325927734375, 0.052764892578125, 0.058414459228515625, 0.06406402587890625, 0.06971359252929688, 0.0753631591796875, 0.08101272583007812, 0.08666229248046875, 0.09231185913085938, 0.09796142578125, 0.10361099243164062, 0.10926055908203125, 0.11491012573242188, 0.1205596923828125, 0.12620925903320312, 0.13185882568359375, 0.13750839233398438, 0.143157958984375, 0.14880752563476562, 0.15445709228515625, 0.16010665893554688, 0.1657562255859375, 0.17140579223632812, 0.17705535888671875, 0.18270492553710938, 0.1883544921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 11.0, 5.0, 17.0, 20.0, 20.0, 27.0, 40.0, 49.0, 56.0, 97.0, 106.0, 142.0, 240.0, 436.0, 838.0, 5130.0, 964904.0, 73064.0, 1703.0, 599.0, 319.0, 167.0, 147.0, 89.0, 77.0, 61.0, 34.0, 29.0, 27.0, 18.0, 16.0, 20.0, 5.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477783203125, -0.46274566650390625, -0.4477081298828125, -0.43267059326171875, -0.417633056640625, -0.40259552001953125, -0.3875579833984375, -0.37252044677734375, -0.35748291015625, -0.34244537353515625, -0.3274078369140625, -0.31237030029296875, -0.297332763671875, -0.28229522705078125, -0.2672576904296875, -0.25222015380859375, -0.2371826171875, -0.22214508056640625, -0.2071075439453125, -0.19207000732421875, -0.177032470703125, -0.16199493408203125, -0.1469573974609375, -0.13191986083984375, -0.11688232421875, -0.10184478759765625, -0.0868072509765625, -0.07176971435546875, -0.056732177734375, -0.04169464111328125, -0.0266571044921875, -0.01161956787109375, 0.00341796875, 0.01845550537109375, 0.0334930419921875, 0.04853057861328125, 0.063568115234375, 0.07860565185546875, 0.0936431884765625, 0.10868072509765625, 0.12371826171875, 0.13875579833984375, 0.1537933349609375, 0.16883087158203125, 0.183868408203125, 0.19890594482421875, 0.2139434814453125, 0.22898101806640625, 0.2440185546875, 0.25905609130859375, 0.2740936279296875, 0.28913116455078125, 0.304168701171875, 0.31920623779296875, 0.3342437744140625, 0.34928131103515625, 0.36431884765625, 0.37935638427734375, 0.3943939208984375, 0.40943145751953125, 0.424468994140625, 0.43950653076171875, 0.4545440673828125, 0.46958160400390625, 0.484619140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 7.0, 10.0, 5.0, 15.0, 15.0, 11.0, 19.0, 27.0, 26.0, 22.0, 41.0, 29.0, 47.0, 46.0, 52.0, 52.0, 48.0, 62.0, 33.0, 52.0, 35.0, 31.0, 42.0, 42.0, 37.0, 32.0, 29.0, 19.0, 16.0, 21.0, 14.0, 13.0, 18.0, 3.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5224609375, -0.5060195922851562, -0.4895782470703125, -0.47313690185546875, -0.456695556640625, -0.44025421142578125, -0.4238128662109375, -0.40737152099609375, -0.39093017578125, -0.37448883056640625, -0.3580474853515625, -0.34160614013671875, -0.325164794921875, -0.30872344970703125, -0.2922821044921875, -0.27584075927734375, -0.2593994140625, -0.24295806884765625, -0.2265167236328125, -0.21007537841796875, -0.193634033203125, -0.17719268798828125, -0.1607513427734375, -0.14430999755859375, -0.12786865234375, -0.11142730712890625, -0.0949859619140625, -0.07854461669921875, -0.062103271484375, -0.04566192626953125, -0.0292205810546875, -0.01277923583984375, 0.003662109375, 0.02010345458984375, 0.0365447998046875, 0.05298614501953125, 0.069427490234375, 0.08586883544921875, 0.1023101806640625, 0.11875152587890625, 0.13519287109375, 0.15163421630859375, 0.1680755615234375, 0.18451690673828125, 0.200958251953125, 0.21739959716796875, 0.2338409423828125, 0.25028228759765625, 0.2667236328125, 0.28316497802734375, 0.2996063232421875, 0.31604766845703125, 0.332489013671875, 0.34893035888671875, 0.3653717041015625, 0.38181304931640625, 0.39825439453125, 0.41469573974609375, 0.4311370849609375, 0.44757843017578125, 0.464019775390625, 0.48046112060546875, 0.4969024658203125, 0.5133438110351562, 0.52978515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 0.0, 4.0, 9.0, 5.0, 6.0, 7.0, 16.0, 13.0, 23.0, 30.0, 44.0, 67.0, 105.0, 146.0, 279.0, 554.0, 1058.0, 2104.0, 5977.0, 23106.0, 300370.0, 673341.0, 29311.0, 6826.0, 2628.0, 1127.0, 561.0, 289.0, 196.0, 102.0, 65.0, 47.0, 38.0, 38.0, 12.0, 12.0, 13.0, 3.0, 8.0, 5.0, 2.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010210275650024414, -9.910576045513153e-05, -9.610876441001892e-05, -9.311176836490631e-05, -9.01147723197937e-05, -8.711777627468109e-05, -8.412078022956848e-05, -8.112378418445587e-05, -7.812678813934326e-05, -7.512979209423065e-05, -7.213279604911804e-05, -6.913580000400543e-05, -6.613880395889282e-05, -6.314180791378021e-05, -6.01448118686676e-05, -5.714781582355499e-05, -5.415081977844238e-05, -5.115382373332977e-05, -4.815682768821716e-05, -4.515983164310455e-05, -4.216283559799194e-05, -3.9165839552879333e-05, -3.6168843507766724e-05, -3.3171847462654114e-05, -3.0174851417541504e-05, -2.7177855372428894e-05, -2.4180859327316284e-05, -2.1183863282203674e-05, -1.8186867237091064e-05, -1.5189871191978455e-05, -1.2192875146865845e-05, -9.195879101753235e-06, -6.198883056640625e-06, -3.201887011528015e-06, -2.0489096641540527e-07, 2.7921050786972046e-06, 5.7891011238098145e-06, 8.786097168922424e-06, 1.1783093214035034e-05, 1.4780089259147644e-05, 1.7777085304260254e-05, 2.0774081349372864e-05, 2.3771077394485474e-05, 2.6768073439598083e-05, 2.9765069484710693e-05, 3.27620655298233e-05, 3.575906157493591e-05, 3.875605762004852e-05, 4.175305366516113e-05, 4.475004971027374e-05, 4.774704575538635e-05, 5.074404180049896e-05, 5.374103784561157e-05, 5.673803389072418e-05, 5.973502993583679e-05, 6.27320259809494e-05, 6.572902202606201e-05, 6.872601807117462e-05, 7.172301411628723e-05, 7.472001016139984e-05, 7.771700620651245e-05, 8.071400225162506e-05, 8.371099829673767e-05, 8.670799434185028e-05, 8.970499038696289e-05]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 9.0, 5.0, 2.0, 8.0, 12.0, 11.0, 14.0, 13.0, 14.0, 19.0, 17.0, 22.0, 40.0, 24.0, 59.0, 63.0, 26.0, 43.0, 49.0, 25.0, 64.0, 56.0, 28.0, 61.0, 19.0, 53.0, 51.0, 12.0, 48.0, 32.0, 16.0, 18.0, 22.0, 4.0, 13.0, 11.0, 2.0, 8.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.337860107421875e-06, -3.2400712370872498e-06, -3.1422823667526245e-06, -3.0444934964179993e-06, -2.946704626083374e-06, -2.8489157557487488e-06, -2.7511268854141235e-06, -2.6533380150794983e-06, -2.555549144744873e-06, -2.457760274410248e-06, -2.3599714040756226e-06, -2.2621825337409973e-06, -2.164393663406372e-06, -2.066604793071747e-06, -1.9688159227371216e-06, -1.8710270524024963e-06, -1.773238182067871e-06, -1.6754493117332458e-06, -1.5776604413986206e-06, -1.4798715710639954e-06, -1.3820827007293701e-06, -1.2842938303947449e-06, -1.1865049600601196e-06, -1.0887160897254944e-06, -9.909272193908691e-07, -8.931383490562439e-07, -7.953494787216187e-07, -6.975606083869934e-07, -5.997717380523682e-07, -5.019828677177429e-07, -4.041939973831177e-07, -3.0640512704849243e-07, -2.086162567138672e-07, -1.1082738637924194e-07, -1.30385160446167e-08, 8.475035429000854e-08, 1.825392246246338e-07, 2.8032809495925903e-07, 3.781169652938843e-07, 4.759058356285095e-07, 5.736947059631348e-07, 6.7148357629776e-07, 7.692724466323853e-07, 8.670613169670105e-07, 9.648501873016357e-07, 1.062639057636261e-06, 1.1604279279708862e-06, 1.2582167983055115e-06, 1.3560056686401367e-06, 1.453794538974762e-06, 1.5515834093093872e-06, 1.6493722796440125e-06, 1.7471611499786377e-06, 1.844950020313263e-06, 1.942738890647888e-06, 2.0405277609825134e-06, 2.1383166313171387e-06, 2.236105501651764e-06, 2.333894371986389e-06, 2.4316832423210144e-06, 2.5294721126556396e-06, 2.627260982990265e-06, 2.72504985332489e-06, 2.8228387236595154e-06, 2.9206275939941406e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 2.0, 5.0, 6.0, 5.0, 7.0, 13.0, 15.0, 17.0, 28.0, 55.0, 73.0, 134.0, 201.0, 390.0, 2165.0, 987293.0, 56164.0, 1157.0, 344.0, 192.0, 90.0, 54.0, 42.0, 27.0, 16.0, 17.0, 12.0, 6.0, 6.0, 1.0, 6.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002613067626953125, -0.0002522505819797516, -0.00024319440126419067, -0.00023413822054862976, -0.00022508203983306885, -0.00021602585911750793, -0.00020696967840194702, -0.0001979134976863861, -0.0001888573169708252, -0.00017980113625526428, -0.00017074495553970337, -0.00016168877482414246, -0.00015263259410858154, -0.00014357641339302063, -0.00013452023267745972, -0.0001254640519618988, -0.00011640787124633789, -0.00010735169053077698, -9.829550981521606e-05, -8.923932909965515e-05, -8.018314838409424e-05, -7.112696766853333e-05, -6.207078695297241e-05, -5.30146062374115e-05, -4.3958425521850586e-05, -3.490224480628967e-05, -2.584606409072876e-05, -1.6789883375167847e-05, -7.733702659606934e-06, 1.3224780559539795e-06, 1.0378658771514893e-05, 1.9434839487075806e-05, 2.849102020263672e-05, 3.754720091819763e-05, 4.6603381633758545e-05, 5.565956234931946e-05, 6.471574306488037e-05, 7.377192378044128e-05, 8.28281044960022e-05, 9.188428521156311e-05, 0.00010094046592712402, 0.00010999664664268494, 0.00011905282735824585, 0.00012810900807380676, 0.00013716518878936768, 0.0001462213695049286, 0.0001552775502204895, 0.00016433373093605042, 0.00017338991165161133, 0.00018244609236717224, 0.00019150227308273315, 0.00020055845379829407, 0.00020961463451385498, 0.0002186708152294159, 0.0002277269959449768, 0.00023678317666053772, 0.00024583935737609863, 0.00025489553809165955, 0.00026395171880722046, 0.00027300789952278137, 0.0002820640802383423, 0.0002911202609539032, 0.0003001764416694641, 0.000309232622385025, 0.00031828880310058594]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 9.0, 17.0, 34.0, 34.0, 45.0, 55.0, 78.0, 84.0, 143.0, 110.0, 100.0, 68.0, 57.0, 28.0, 25.0, 24.0, 18.0, 13.0, 7.0, 8.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000286102294921875, -0.0002761855721473694, -0.00026626884937286377, -0.00025635212659835815, -0.00024643540382385254, -0.00023651868104934692, -0.0002266019582748413, -0.0002166852355003357, -0.00020676851272583008, -0.00019685178995132446, -0.00018693506717681885, -0.00017701834440231323, -0.00016710162162780762, -0.000157184898853302, -0.0001472681760787964, -0.00013735145330429077, -0.00012743473052978516, -0.00011751800775527954, -0.00010760128498077393, -9.768456220626831e-05, -8.77678394317627e-05, -7.785111665725708e-05, -6.793439388275146e-05, -5.801767110824585e-05, -4.8100948333740234e-05, -3.818422555923462e-05, -2.8267502784729004e-05, -1.835078001022339e-05, -8.434057235717773e-06, 1.4826655387878418e-06, 1.1399388313293457e-05, 2.1316111087799072e-05, 3.123283386230469e-05, 4.11495566368103e-05, 5.106627941131592e-05, 6.098300218582153e-05, 7.089972496032715e-05, 8.081644773483276e-05, 9.073317050933838e-05, 0.000100649893283844, 0.00011056661605834961, 0.00012048333883285522, 0.00013040006160736084, 0.00014031678438186646, 0.00015023350715637207, 0.00016015022993087769, 0.0001700669527053833, 0.00017998367547988892, 0.00018990039825439453, 0.00019981712102890015, 0.00020973384380340576, 0.00021965056657791138, 0.000229567289352417, 0.0002394840121269226, 0.0002494007349014282, 0.00025931745767593384, 0.00026923418045043945, 0.00027915090322494507, 0.0002890676259994507, 0.0002989843487739563, 0.0003089010715484619, 0.00031881779432296753, 0.00032873451709747314, 0.00033865123987197876, 0.0003485679626464844]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 22.0, 157.0, 766.0, 58.0, 7.0, 4.0, 2.0], "bins": [-6.434990882873535, -6.3264875411987305, -6.217984199523926, -6.109480857849121, -6.000977993011475, -5.89247465133667, -5.783971309661865, -5.6754679679870605, -5.566964626312256, -5.458461284637451, -5.3499579429626465, -5.241455078125, -5.132951736450195, -5.024448394775391, -4.915945053100586, -4.807441711425781, -4.698938369750977, -4.590435028076172, -4.481931686401367, -4.3734283447265625, -4.264925479888916, -4.156422138214111, -4.047918796539307, -3.939415454864502, -3.8309125900268555, -3.722409248352051, -3.613906145095825, -3.5054028034210205, -3.396899461746216, -3.2883963584899902, -3.1798930168151855, -3.071389675140381, -2.9628865718841553, -2.8543832302093506, -2.745880126953125, -2.6373767852783203, -2.5288734436035156, -2.420370101928711, -2.3118669986724854, -2.2033636569976807, -2.094860315322876, -1.9863570928573608, -1.8778537511825562, -1.769350528717041, -1.6608471870422363, -1.5523439645767212, -1.443840742111206, -1.3353374004364014, -1.2268342971801758, -1.1183310747146606, -1.009827733039856, -0.9013245105743408, -0.7928212285041809, -0.684317946434021, -0.5758147239685059, -0.46731144189834595, -0.35880810022354126, -0.25030481815338135, -0.14180156588554382, -0.0332983136177063, 0.07520496845245361, 0.18370825052261353, 0.29221147298812866, 0.4007147550582886, 0.5092180371284485]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 8.0, 3.0, 4.0, 8.0, 7.0, 13.0, 13.0, 11.0, 17.0, 26.0, 23.0, 29.0, 23.0, 41.0, 28.0, 33.0, 32.0, 52.0, 47.0, 47.0, 39.0, 41.0, 61.0, 42.0, 41.0, 36.0, 43.0, 39.0, 31.0, 31.0, 18.0, 27.0, 16.0, 15.0, 17.0, 11.0, 7.0, 8.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.9752357006073, -2.895128011703491, -2.8150203227996826, -2.734912633895874, -2.6548049449920654, -2.574697494506836, -2.4945898056030273, -2.4144821166992188, -2.33437442779541, -2.2542667388916016, -2.174159049987793, -2.0940513610839844, -2.013943672180176, -1.9338361024856567, -1.8537284135818481, -1.773620843887329, -1.693513035774231, -1.6134053468704224, -1.5332976579666138, -1.4531900882720947, -1.3730823993682861, -1.2929747104644775, -1.212867021560669, -1.1327593326568604, -1.0526516437530518, -0.9725439548492432, -0.8924363255500793, -0.8123286366462708, -0.7322210073471069, -0.6521133184432983, -0.5720056295394897, -0.4918980002403259, -0.4117903709411621, -0.3316827118396759, -0.2515750527381897, -0.1714673638343811, -0.0913597047328949, -0.011252045631408691, 0.0688556432723999, 0.14896327257156372, 0.22907096147537231, 0.3091786205768585, 0.3892862796783447, 0.4693939685821533, 0.5495016574859619, 0.6296092867851257, 0.7097169756889343, 0.7898246049880981, 0.8699322938919067, 0.9500399827957153, 1.030147671699524, 1.110255241394043, 1.1903629302978516, 1.2704706192016602, 1.3505783081054688, 1.4306859970092773, 1.510793685913086, 1.5909013748168945, 1.6710090637207031, 1.7511167526245117, 1.8312243223190308, 1.9113320112228394, 1.991439700126648, 2.071547269821167, 2.1516549587249756]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 10.0, 5.0, 5.0, 8.0, 12.0, 7.0, 14.0, 15.0, 26.0, 45.0, 135.0, 597.0, 4192526.0, 649.0, 48.0, 29.0, 19.0, 13.0, 18.0, 16.0, 7.0, 12.0, 11.0, 8.0, 8.0, 2.0, 9.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3173828125, -1.274322509765625, -1.23126220703125, -1.188201904296875, -1.1451416015625, -1.102081298828125, -1.05902099609375, -1.015960693359375, -0.972900390625, -0.929840087890625, -0.88677978515625, -0.843719482421875, -0.8006591796875, -0.757598876953125, -0.71453857421875, -0.671478271484375, -0.62841796875, -0.585357666015625, -0.54229736328125, -0.499237060546875, -0.4561767578125, -0.413116455078125, -0.37005615234375, -0.326995849609375, -0.283935546875, -0.240875244140625, -0.19781494140625, -0.154754638671875, -0.1116943359375, -0.068634033203125, -0.02557373046875, 0.017486572265625, 0.060546875, 0.103607177734375, 0.14666748046875, 0.189727783203125, 0.2327880859375, 0.275848388671875, 0.31890869140625, 0.361968994140625, 0.405029296875, 0.448089599609375, 0.49114990234375, 0.534210205078125, 0.5772705078125, 0.620330810546875, 0.66339111328125, 0.706451416015625, 0.74951171875, 0.792572021484375, 0.83563232421875, 0.878692626953125, 0.9217529296875, 0.964813232421875, 1.00787353515625, 1.050933837890625, 1.093994140625, 1.137054443359375, 1.18011474609375, 1.223175048828125, 1.2662353515625, 1.309295654296875, 1.35235595703125, 1.395416259765625, 1.4384765625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 8.0, 4.0, 4.0, 6.0, 8.0, 5.0, 9.0, 6.0, 14.0, 27.0, 114.0, 241.0, 293.0, 131.0, 30.0, 12.0, 6.0, 6.0, 9.0, 9.0, 4.0, 6.0, 4.0, 5.0, 5.0, 2.0, 7.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.171142578125, -0.16554641723632812, -0.15995025634765625, -0.15435409545898438, -0.1487579345703125, -0.14316177368164062, -0.13756561279296875, -0.13196945190429688, -0.126373291015625, -0.12077713012695312, -0.11518096923828125, -0.10958480834960938, -0.1039886474609375, -0.09839248657226562, -0.09279632568359375, -0.08720016479492188, -0.08160400390625, -0.07600784301757812, -0.07041168212890625, -0.06481552124023438, -0.0592193603515625, -0.053623199462890625, -0.04802703857421875, -0.042430877685546875, -0.036834716796875, -0.031238555908203125, -0.02564239501953125, -0.020046234130859375, -0.0144500732421875, -0.008853912353515625, -0.00325775146484375, 0.002338409423828125, 0.0079345703125, 0.013530731201171875, 0.01912689208984375, 0.024723052978515625, 0.0303192138671875, 0.035915374755859375, 0.04151153564453125, 0.047107696533203125, 0.052703857421875, 0.058300018310546875, 0.06389617919921875, 0.06949234008789062, 0.0750885009765625, 0.08068466186523438, 0.08628082275390625, 0.09187698364257812, 0.09747314453125, 0.10306930541992188, 0.10866546630859375, 0.11426162719726562, 0.1198577880859375, 0.12545394897460938, 0.13105010986328125, 0.13664627075195312, 0.142242431640625, 0.14783859252929688, 0.15343475341796875, 0.15903091430664062, 0.1646270751953125, 0.17022323608398438, 0.17581939697265625, 0.18141555786132812, 0.18701171875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 20.0, 31.0, 105.0, 372.0, 1057.0, 41227.0, 4149363.0, 1363.0, 491.0, 156.0, 57.0, 16.0, 3.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.42041015625, -0.4090690612792969, -0.39772796630859375, -0.3863868713378906, -0.3750457763671875, -0.3637046813964844, -0.35236358642578125, -0.3410224914550781, -0.329681396484375, -0.3183403015136719, -0.30699920654296875, -0.2956581115722656, -0.2843170166015625, -0.2729759216308594, -0.26163482666015625, -0.2502937316894531, -0.23895263671875, -0.22761154174804688, -0.21627044677734375, -0.20492935180664062, -0.1935882568359375, -0.18224716186523438, -0.17090606689453125, -0.15956497192382812, -0.148223876953125, -0.13688278198242188, -0.12554168701171875, -0.11420059204101562, -0.1028594970703125, -0.09151840209960938, -0.08017730712890625, -0.06883621215820312, -0.0574951171875, -0.046154022216796875, -0.03481292724609375, -0.023471832275390625, -0.0121307373046875, -0.000789642333984375, 0.01055145263671875, 0.021892547607421875, 0.033233642578125, 0.044574737548828125, 0.05591583251953125, 0.06725692749023438, 0.0785980224609375, 0.08993911743164062, 0.10128021240234375, 0.11262130737304688, 0.12396240234375, 0.13530349731445312, 0.14664459228515625, 0.15798568725585938, 0.1693267822265625, 0.18066787719726562, 0.19200897216796875, 0.20335006713867188, 0.214691162109375, 0.22603225708007812, 0.23737335205078125, 0.24871444702148438, 0.2600555419921875, 0.2713966369628906, 0.28273773193359375, 0.2940788269042969, 0.305419921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 9.0, 16.0, 32.0, 3867.0, 116.0, 16.0, 9.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0986328125, -0.094940185546875, -0.09124755859375, -0.087554931640625, -0.0838623046875, -0.080169677734375, -0.07647705078125, -0.072784423828125, -0.069091796875, -0.065399169921875, -0.06170654296875, -0.058013916015625, -0.0543212890625, -0.050628662109375, -0.04693603515625, -0.043243408203125, -0.03955078125, -0.035858154296875, -0.03216552734375, -0.028472900390625, -0.0247802734375, -0.021087646484375, -0.01739501953125, -0.013702392578125, -0.010009765625, -0.006317138671875, -0.00262451171875, 0.001068115234375, 0.0047607421875, 0.008453369140625, 0.01214599609375, 0.015838623046875, 0.01953125, 0.023223876953125, 0.02691650390625, 0.030609130859375, 0.0343017578125, 0.037994384765625, 0.04168701171875, 0.045379638671875, 0.049072265625, 0.052764892578125, 0.05645751953125, 0.060150146484375, 0.0638427734375, 0.067535400390625, 0.07122802734375, 0.074920654296875, 0.07861328125, 0.082305908203125, 0.08599853515625, 0.089691162109375, 0.0933837890625, 0.097076416015625, 0.10076904296875, 0.104461669921875, 0.108154296875, 0.111846923828125, 0.11553955078125, 0.119232177734375, 0.1229248046875, 0.126617431640625, 0.13031005859375, 0.134002685546875, 0.1376953125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 247.0, 761.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18416857719421387, -0.17338396608829498, -0.1625993549823761, -0.1518147587776184, -0.14103014767169952, -0.13024553656578064, -0.11946093291044235, -0.10867632925510406, -0.09789171814918518, -0.0871071070432663, -0.07632250338792801, -0.06553789973258972, -0.05475328862667084, -0.04396868124604225, -0.033184073865413666, -0.02239947021007538, -0.011614859104156494, -0.0008302517235279083, 0.009954355657100677, 0.020738963037729263, 0.03152357041835785, 0.042308177798986435, 0.05309278517961502, 0.06387738883495331, 0.07466199994087219, 0.08544661104679108, 0.09623121470212936, 0.10701581835746765, 0.11780042946338654, 0.12858504056930542, 0.1393696367740631, 0.150154247879982, 0.16093885898590088, 0.17172347009181976, 0.18250808119773865, 0.19329267740249634, 0.20407728850841522, 0.2148618996143341, 0.2256464958190918, 0.23643110692501068, 0.24721571803092957, 0.25800031423568726, 0.26878494024276733, 0.279569536447525, 0.2903541326522827, 0.3011387586593628, 0.3119233548641205, 0.3227079510688782, 0.33349257707595825, 0.34427717328071594, 0.355061799287796, 0.3658463954925537, 0.3766310214996338, 0.3874156177043915, 0.39820021390914917, 0.40898483991622925, 0.41976943612098694, 0.43055403232574463, 0.4413386583328247, 0.4521232545375824, 0.4629078507423401, 0.47369247674942017, 0.48447707295417786, 0.49526166915893555, 0.5060462951660156]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 6.0, 4.0, 9.0, 5.0, 5.0, 9.0, 10.0, 11.0, 12.0, 23.0, 20.0, 31.0, 29.0, 28.0, 43.0, 37.0, 33.0, 38.0, 41.0, 47.0, 42.0, 42.0, 39.0, 43.0, 48.0, 35.0, 29.0, 39.0, 30.0, 32.0, 23.0, 23.0, 29.0, 16.0, 23.0, 11.0, 11.0, 6.0, 12.0, 6.0, 5.0, 1.0, 5.0, 6.0, 4.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10939860343933105, -0.10604093968868256, -0.10268327593803406, -0.09932560473680496, -0.09596794098615646, -0.09261027723550797, -0.08925260603427887, -0.08589494228363037, -0.08253727853298187, -0.07917961478233337, -0.07582195103168488, -0.07246427983045578, -0.06910661607980728, -0.06574895232915878, -0.062391284853219986, -0.05903361737728119, -0.05567595362663269, -0.05231828987598419, -0.048960622400045395, -0.0456029549241066, -0.0422452911734581, -0.0388876274228096, -0.035529959946870804, -0.03217229247093201, -0.02881462872028351, -0.02545696310698986, -0.022099297493696213, -0.018741631880402565, -0.015383966267108917, -0.01202630065381527, -0.008668635040521622, -0.005310969427227974, -0.001953303813934326, 0.0014043617993593216, 0.004762027412652969, 0.008119693025946617, 0.011477358639240265, 0.014835024252533913, 0.01819268986582756, 0.021550355479121208, 0.024908021092414856, 0.028265686705708504, 0.03162335231900215, 0.03498101979494095, 0.03833868354558945, 0.041696347296237946, 0.04505401477217674, 0.04841168224811554, 0.05176934599876404, 0.05512700974941254, 0.058484677225351334, 0.06184234470129013, 0.06520000845193863, 0.06855767220258713, 0.07191534340381622, 0.07527300715446472, 0.07863067090511322, 0.08198833465576172, 0.08534599840641022, 0.08870366960763931, 0.09206133335828781, 0.09541899710893631, 0.0987766683101654, 0.1021343320608139, 0.1054919958114624]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 7.0, 7.0, 13.0, 27.0, 27.0, 37.0, 51.0, 65.0, 101.0, 156.0, 186.0, 289.0, 408.0, 639.0, 831.0, 1366.0, 2072.0, 3426.0, 6026.0, 12505.0, 41361.0, 883967.0, 63056.0, 14412.0, 6955.0, 3833.0, 2352.0, 1393.0, 938.0, 600.0, 393.0, 317.0, 195.0, 161.0, 103.0, 75.0, 62.0, 33.0, 24.0, 23.0, 18.0, 5.0, 7.0, 7.0, 13.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.157470703125, -0.15232276916503906, -0.14717483520507812, -0.1420269012451172, -0.13687896728515625, -0.1317310333251953, -0.12658309936523438, -0.12143516540527344, -0.1162872314453125, -0.11113929748535156, -0.10599136352539062, -0.10084342956542969, -0.09569549560546875, -0.09054756164550781, -0.08539962768554688, -0.08025169372558594, -0.075103759765625, -0.06995582580566406, -0.06480789184570312, -0.05965995788574219, -0.05451202392578125, -0.04936408996582031, -0.044216156005859375, -0.03906822204589844, -0.0339202880859375, -0.028772354125976562, -0.023624420166015625, -0.018476486206054688, -0.01332855224609375, -0.008180618286132812, -0.003032684326171875, 0.0021152496337890625, 0.00726318359375, 0.012411117553710938, 0.017559051513671875, 0.022706985473632812, 0.02785491943359375, 0.03300285339355469, 0.038150787353515625, 0.04329872131347656, 0.0484466552734375, 0.05359458923339844, 0.058742523193359375, 0.06389045715332031, 0.06903839111328125, 0.07418632507324219, 0.07933425903320312, 0.08448219299316406, 0.089630126953125, 0.09477806091308594, 0.09992599487304688, 0.10507392883300781, 0.11022186279296875, 0.11536979675292969, 0.12051773071289062, 0.12566566467285156, 0.1308135986328125, 0.13596153259277344, 0.14110946655273438, 0.1462574005126953, 0.15140533447265625, 0.1565532684326172, 0.16170120239257812, 0.16684913635253906, 0.1719970703125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 8.0, 4.0, 4.0, 6.0, 8.0, 5.0, 9.0, 6.0, 14.0, 29.0, 111.0, 241.0, 290.0, 134.0, 31.0, 12.0, 7.0, 5.0, 8.0, 10.0, 4.0, 6.0, 4.0, 5.0, 5.0, 2.0, 7.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.171142578125, -0.16554641723632812, -0.15995025634765625, -0.15435409545898438, -0.1487579345703125, -0.14316177368164062, -0.13756561279296875, -0.13196945190429688, -0.126373291015625, -0.12077713012695312, -0.11518096923828125, -0.10958480834960938, -0.1039886474609375, -0.09839248657226562, -0.09279632568359375, -0.08720016479492188, -0.08160400390625, -0.07600784301757812, -0.07041168212890625, -0.06481552124023438, -0.0592193603515625, -0.053623199462890625, -0.04802703857421875, -0.042430877685546875, -0.036834716796875, -0.031238555908203125, -0.02564239501953125, -0.020046234130859375, -0.0144500732421875, -0.008853912353515625, -0.00325775146484375, 0.002338409423828125, 0.0079345703125, 0.013530731201171875, 0.01912689208984375, 0.024723052978515625, 0.0303192138671875, 0.035915374755859375, 0.04151153564453125, 0.047107696533203125, 0.052703857421875, 0.058300018310546875, 0.06389617919921875, 0.06949234008789062, 0.0750885009765625, 0.08068466186523438, 0.08628082275390625, 0.09187698364257812, 0.09747314453125, 0.10306930541992188, 0.10866546630859375, 0.11426162719726562, 0.1198577880859375, 0.12545394897460938, 0.13105010986328125, 0.13664627075195312, 0.142242431640625, 0.14783859252929688, 0.15343475341796875, 0.15903091430664062, 0.1646270751953125, 0.17022323608398438, 0.17581939697265625, 0.18141555786132812, 0.18701171875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 3.0, 8.0, 5.0, 12.0, 14.0, 20.0, 16.0, 34.0, 43.0, 49.0, 43.0, 62.0, 111.0, 132.0, 230.0, 360.0, 677.0, 2481.0, 107391.0, 927062.0, 7398.0, 1039.0, 438.0, 284.0, 155.0, 111.0, 79.0, 68.0, 40.0, 36.0, 28.0, 27.0, 21.0, 19.0, 21.0, 11.0, 7.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38232421875, -0.36876678466796875, -0.3552093505859375, -0.34165191650390625, -0.328094482421875, -0.31453704833984375, -0.3009796142578125, -0.28742218017578125, -0.27386474609375, -0.26030731201171875, -0.2467498779296875, -0.23319244384765625, -0.219635009765625, -0.20607757568359375, -0.1925201416015625, -0.17896270751953125, -0.1654052734375, -0.15184783935546875, -0.1382904052734375, -0.12473297119140625, -0.111175537109375, -0.09761810302734375, -0.0840606689453125, -0.07050323486328125, -0.05694580078125, -0.04338836669921875, -0.0298309326171875, -0.01627349853515625, -0.002716064453125, 0.01084136962890625, 0.0243988037109375, 0.03795623779296875, 0.051513671875, 0.06507110595703125, 0.0786285400390625, 0.09218597412109375, 0.105743408203125, 0.11930084228515625, 0.1328582763671875, 0.14641571044921875, 0.15997314453125, 0.17353057861328125, 0.1870880126953125, 0.20064544677734375, 0.214202880859375, 0.22776031494140625, 0.2413177490234375, 0.25487518310546875, 0.2684326171875, 0.28199005126953125, 0.2955474853515625, 0.30910491943359375, 0.322662353515625, 0.33621978759765625, 0.3497772216796875, 0.36333465576171875, 0.37689208984375, 0.39044952392578125, 0.4040069580078125, 0.41756439208984375, 0.431121826171875, 0.44467926025390625, 0.4582366943359375, 0.47179412841796875, 0.4853515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 3.0, 7.0, 4.0, 7.0, 11.0, 12.0, 11.0, 19.0, 27.0, 27.0, 17.0, 27.0, 42.0, 36.0, 45.0, 53.0, 45.0, 37.0, 48.0, 38.0, 47.0, 58.0, 41.0, 48.0, 31.0, 46.0, 31.0, 32.0, 26.0, 17.0, 16.0, 21.0, 14.0, 12.0, 15.0, 9.0, 5.0, 3.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.450439453125, -0.4344673156738281, -0.41849517822265625, -0.4025230407714844, -0.3865509033203125, -0.3705787658691406, -0.35460662841796875, -0.3386344909667969, -0.322662353515625, -0.3066902160644531, -0.29071807861328125, -0.2747459411621094, -0.2587738037109375, -0.24280166625976562, -0.22682952880859375, -0.21085739135742188, -0.19488525390625, -0.17891311645507812, -0.16294097900390625, -0.14696884155273438, -0.1309967041015625, -0.11502456665039062, -0.09905242919921875, -0.08308029174804688, -0.067108154296875, -0.051136016845703125, -0.03516387939453125, -0.019191741943359375, -0.0032196044921875, 0.012752532958984375, 0.02872467041015625, 0.044696807861328125, 0.0606689453125, 0.07664108276367188, 0.09261322021484375, 0.10858535766601562, 0.1245574951171875, 0.14052963256835938, 0.15650177001953125, 0.17247390747070312, 0.188446044921875, 0.20441818237304688, 0.22039031982421875, 0.23636245727539062, 0.2523345947265625, 0.2683067321777344, 0.28427886962890625, 0.3002510070800781, 0.31622314453125, 0.3321952819824219, 0.34816741943359375, 0.3641395568847656, 0.3801116943359375, 0.3960838317871094, 0.41205596923828125, 0.4280281066894531, 0.444000244140625, 0.4599723815917969, 0.47594451904296875, 0.4919166564941406, 0.5078887939453125, 0.5238609313964844, 0.5398330688476562, 0.5558052062988281, 0.57177734375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 11.0, 16.0, 13.0, 31.0, 37.0, 69.0, 86.0, 152.0, 248.0, 363.0, 616.0, 1223.0, 2557.0, 6497.0, 32992.0, 921287.0, 67328.0, 8719.0, 3025.0, 1356.0, 749.0, 429.0, 264.0, 169.0, 105.0, 64.0, 51.0, 26.0, 16.0, 13.0, 9.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.480382919311523e-05, -7.236097007989883e-05, -6.991811096668243e-05, -6.747525185346603e-05, -6.503239274024963e-05, -6.258953362703323e-05, -6.0146674513816833e-05, -5.770381540060043e-05, -5.526095628738403e-05, -5.281809717416763e-05, -5.037523806095123e-05, -4.793237894773483e-05, -4.548951983451843e-05, -4.304666072130203e-05, -4.060380160808563e-05, -3.816094249486923e-05, -3.571808338165283e-05, -3.327522426843643e-05, -3.083236515522003e-05, -2.838950604200363e-05, -2.594664692878723e-05, -2.350378781557083e-05, -2.106092870235443e-05, -1.861806958913803e-05, -1.617521047592163e-05, -1.373235136270523e-05, -1.128949224948883e-05, -8.84663313627243e-06, -6.40377402305603e-06, -3.96091490983963e-06, -1.51805579662323e-06, 9.248033165931702e-07, 3.3676624298095703e-06, 5.8105215430259705e-06, 8.25338065624237e-06, 1.069623976945877e-05, 1.3139098882675171e-05, 1.558195799589157e-05, 1.802481710910797e-05, 2.046767622232437e-05, 2.291053533554077e-05, 2.535339444875717e-05, 2.7796253561973572e-05, 3.0239112675189972e-05, 3.268197178840637e-05, 3.512483090162277e-05, 3.756769001483917e-05, 4.001054912805557e-05, 4.245340824127197e-05, 4.489626735448837e-05, 4.733912646770477e-05, 4.978198558092117e-05, 5.222484469413757e-05, 5.4667703807353973e-05, 5.7110562920570374e-05, 5.9553422033786774e-05, 6.199628114700317e-05, 6.443914026021957e-05, 6.688199937343597e-05, 6.932485848665237e-05, 7.176771759986877e-05, 7.421057671308517e-05, 7.665343582630157e-05, 7.909629493951797e-05, 8.153915405273438e-05]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 3.0, 8.0, 11.0, 3.0, 15.0, 24.0, 12.0, 28.0, 30.0, 54.0, 21.0, 49.0, 53.0, 65.0, 35.0, 59.0, 73.0, 66.0, 34.0, 63.0, 60.0, 10.0, 40.0, 39.0, 38.0, 14.0, 15.0, 21.0, 9.0, 7.0, 13.0, 10.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9206275939941406e-06, -2.8172507882118225e-06, -2.7138739824295044e-06, -2.6104971766471863e-06, -2.507120370864868e-06, -2.40374356508255e-06, -2.300366759300232e-06, -2.196989953517914e-06, -2.0936131477355957e-06, -1.9902363419532776e-06, -1.8868595361709595e-06, -1.7834827303886414e-06, -1.6801059246063232e-06, -1.5767291188240051e-06, -1.473352313041687e-06, -1.369975507259369e-06, -1.2665987014770508e-06, -1.1632218956947327e-06, -1.0598450899124146e-06, -9.564682841300964e-07, -8.530914783477783e-07, -7.497146725654602e-07, -6.463378667831421e-07, -5.42961061000824e-07, -4.3958425521850586e-07, -3.3620744943618774e-07, -2.3283064365386963e-07, -1.2945383787155151e-07, -2.60770320892334e-08, 7.729977369308472e-08, 1.8067657947540283e-07, 2.8405338525772095e-07, 3.8743019104003906e-07, 4.908069968223572e-07, 5.941838026046753e-07, 6.975606083869934e-07, 8.009374141693115e-07, 9.043142199516296e-07, 1.0076910257339478e-06, 1.1110678315162659e-06, 1.214444637298584e-06, 1.317821443080902e-06, 1.4211982488632202e-06, 1.5245750546455383e-06, 1.6279518604278564e-06, 1.7313286662101746e-06, 1.8347054719924927e-06, 1.938082277774811e-06, 2.041459083557129e-06, 2.144835889339447e-06, 2.248212695121765e-06, 2.3515895009040833e-06, 2.4549663066864014e-06, 2.5583431124687195e-06, 2.6617199182510376e-06, 2.7650967240333557e-06, 2.868473529815674e-06, 2.971850335597992e-06, 3.07522714138031e-06, 3.178603947162628e-06, 3.2819807529449463e-06, 3.3853575587272644e-06, 3.4887343645095825e-06, 3.5921111702919006e-06, 3.6954879760742188e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 9.0, 15.0, 16.0, 27.0, 43.0, 72.0, 117.0, 368.0, 2382.0, 982511.0, 60907.0, 1481.0, 253.0, 147.0, 58.0, 28.0, 27.0, 16.0, 11.0, 8.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00018608570098876953, -0.00018006190657615662, -0.0001740381121635437, -0.00016801431775093079, -0.00016199052333831787, -0.00015596672892570496, -0.00014994293451309204, -0.00014391914010047913, -0.0001378953456878662, -0.0001318715512752533, -0.00012584775686264038, -0.00011982396245002747, -0.00011380016803741455, -0.00010777637362480164, -0.00010175257921218872, -9.57287847995758e-05, -8.970499038696289e-05, -8.368119597434998e-05, -7.765740156173706e-05, -7.163360714912415e-05, -6.560981273651123e-05, -5.9586018323898315e-05, -5.35622239112854e-05, -4.7538429498672485e-05, -4.151463508605957e-05, -3.5490840673446655e-05, -2.946704626083374e-05, -2.3443251848220825e-05, -1.741945743560791e-05, -1.1395663022994995e-05, -5.37186861038208e-06, 6.51925802230835e-07, 6.67572021484375e-06, 1.2699514627456665e-05, 1.872330904006958e-05, 2.4747103452682495e-05, 3.077089786529541e-05, 3.6794692277908325e-05, 4.281848669052124e-05, 4.8842281103134155e-05, 5.486607551574707e-05, 6.0889869928359985e-05, 6.69136643409729e-05, 7.293745875358582e-05, 7.896125316619873e-05, 8.498504757881165e-05, 9.100884199142456e-05, 9.703263640403748e-05, 0.00010305643081665039, 0.0001090802252292633, 0.00011510401964187622, 0.00012112781405448914, 0.00012715160846710205, 0.00013317540287971497, 0.00013919919729232788, 0.0001452229917049408, 0.0001512467861175537, 0.00015727058053016663, 0.00016329437494277954, 0.00016931816935539246, 0.00017534196376800537, 0.00018136575818061829, 0.0001873895525932312, 0.00019341334700584412, 0.00019943714141845703]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 16.0, 26.0, 40.0, 82.0, 119.0, 224.0, 150.0, 126.0, 71.0, 59.0, 19.0, 12.0, 8.0, 8.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00021922588348388672, -0.00021213479340076447, -0.0002050437033176422, -0.00019795261323451996, -0.0001908615231513977, -0.00018377043306827545, -0.0001766793429851532, -0.00016958825290203094, -0.0001624971628189087, -0.00015540607273578644, -0.00014831498265266418, -0.00014122389256954193, -0.00013413280248641968, -0.00012704171240329742, -0.00011995062232017517, -0.00011285953223705292, -0.00010576844215393066, -9.867735207080841e-05, -9.158626198768616e-05, -8.44951719045639e-05, -7.740408182144165e-05, -7.03129917383194e-05, -6.322190165519714e-05, -5.613081157207489e-05, -4.903972148895264e-05, -4.194863140583038e-05, -3.485754132270813e-05, -2.7766451239585876e-05, -2.0675361156463623e-05, -1.358427107334137e-05, -6.493180990219116e-06, 5.979090929031372e-07, 7.68899917602539e-06, 1.4780089259147644e-05, 2.1871179342269897e-05, 2.896226942539215e-05, 3.6053359508514404e-05, 4.314444959163666e-05, 5.023553967475891e-05, 5.7326629757881165e-05, 6.441771984100342e-05, 7.150880992412567e-05, 7.859990000724792e-05, 8.569099009037018e-05, 9.278208017349243e-05, 9.987317025661469e-05, 0.00010696426033973694, 0.00011405535042285919, 0.00012114644050598145, 0.0001282375305891037, 0.00013532862067222595, 0.0001424197107553482, 0.00014951080083847046, 0.0001566018909215927, 0.00016369298100471497, 0.00017078407108783722, 0.00017787516117095947, 0.00018496625125408173, 0.00019205734133720398, 0.00019914843142032623, 0.00020623952150344849, 0.00021333061158657074, 0.000220421701669693, 0.00022751279175281525, 0.0002346038818359375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 271.0, 736.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7332834005355835, -0.49449557065963745, -0.2557077705860138, -0.016919970512390137, 0.2218678593635559, 0.46065568923950195, 0.6994434595108032, 0.938231348991394, 1.1770191192626953, 1.4158068895339966, 1.6545947790145874, 1.8933825492858887, 2.1321704387664795, 2.3709583282470703, 2.609745979309082, 2.848533868789673, 3.0873217582702637, 3.3261096477508545, 3.564897298812866, 3.803685188293457, 4.042472839355469, 4.281260967254639, 4.52004861831665, 4.75883674621582, 4.997624397277832, 5.236412048339844, 5.475200176239014, 5.713987827301025, 5.952775478363037, 6.191563606262207, 6.430351257324219, 6.6691389083862305, 6.9079270362854, 7.146714687347412, 7.385502815246582, 7.624290466308594, 7.8630781173706055, 8.101865768432617, 8.340654373168945, 8.579442024230957, 8.818229675292969, 9.05701732635498, 9.295804977416992, 9.53459358215332, 9.773381233215332, 10.012168884277344, 10.250956535339355, 10.489744186401367, 10.728531837463379, 10.96731948852539, 11.206107139587402, 11.444894790649414, 11.683683395385742, 11.922471046447754, 12.161258697509766, 12.400046348571777, 12.638834953308105, 12.877622604370117, 13.116410255432129, 13.35519790649414, 13.593986511230469, 13.83277416229248, 14.071561813354492, 14.310349464416504, 14.549137115478516]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 6.0, 3.0, 7.0, 9.0, 7.0, 11.0, 20.0, 20.0, 19.0, 21.0, 36.0, 44.0, 23.0, 41.0, 58.0, 49.0, 62.0, 52.0, 57.0, 50.0, 59.0, 39.0, 42.0, 36.0, 38.0, 33.0, 31.0, 22.0, 19.0, 16.0, 22.0, 19.0, 7.0, 4.0, 8.0, 3.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.67372989654541, -2.5913474559783936, -2.508965015411377, -2.4265828132629395, -2.344200372695923, -2.2618179321289062, -2.1794354915618896, -2.097053050994873, -2.0146706104278564, -1.9322881698608398, -1.8499058485031128, -1.7675234079360962, -1.6851409673690796, -1.6027586460113525, -1.520376205444336, -1.4379937648773193, -1.3556114435195923, -1.2732290029525757, -1.1908466815948486, -1.108464241027832, -1.0260818004608154, -0.9436994194984436, -0.8613170385360718, -0.7789345979690552, -0.6965522170066833, -0.6141698360443115, -0.5317873954772949, -0.4494050145149231, -0.3670226037502289, -0.28464019298553467, -0.20225781202316284, -0.11987537145614624, -0.037492990493774414, 0.0448894128203392, 0.12727181613445282, 0.20965421199798584, 0.29203662276268005, 0.37441903352737427, 0.4568014144897461, 0.5391838550567627, 0.6215662360191345, 0.7039486169815063, 0.786331057548523, 0.8687134385108948, 0.9510958194732666, 1.0334782600402832, 1.1158607006072998, 1.1982431411743164, 1.2806254625320435, 1.36300790309906, 1.445390224456787, 1.5277726650238037, 1.6101551055908203, 1.692537546157837, 1.774919867515564, 1.8573023080825806, 1.9396846294403076, 2.022067070007324, 2.104449510574341, 2.1868319511413574, 2.269214153289795, 2.3515965938568115, 2.433979034423828, 2.5163614749908447, 2.5987439155578613]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 4.0, 4.0, 7.0, 7.0, 6.0, 7.0, 7.0, 14.0, 28.0, 115.0, 285.0, 4193222.0, 360.0, 83.0, 31.0, 12.0, 6.0, 8.0, 11.0, 3.0, 6.0, 4.0, 5.0, 5.0, 1.0, 7.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.041015625, -2.941986083984375, -2.84295654296875, -2.743927001953125, -2.6448974609375, -2.545867919921875, -2.44683837890625, -2.347808837890625, -2.248779296875, -2.149749755859375, -2.05072021484375, -1.951690673828125, -1.8526611328125, -1.753631591796875, -1.65460205078125, -1.555572509765625, -1.45654296875, -1.357513427734375, -1.25848388671875, -1.159454345703125, -1.0604248046875, -0.961395263671875, -0.86236572265625, -0.763336181640625, -0.664306640625, -0.565277099609375, -0.46624755859375, -0.367218017578125, -0.2681884765625, -0.169158935546875, -0.07012939453125, 0.028900146484375, 0.1279296875, 0.226959228515625, 0.32598876953125, 0.425018310546875, 0.5240478515625, 0.623077392578125, 0.72210693359375, 0.821136474609375, 0.920166015625, 1.019195556640625, 1.11822509765625, 1.217254638671875, 1.3162841796875, 1.415313720703125, 1.51434326171875, 1.613372802734375, 1.71240234375, 1.811431884765625, 1.91046142578125, 2.009490966796875, 2.1085205078125, 2.207550048828125, 2.30657958984375, 2.405609130859375, 2.504638671875, 2.603668212890625, 2.70269775390625, 2.801727294921875, 2.9007568359375, 2.999786376953125, 3.09881591796875, 3.197845458984375, 3.296875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 4.0, 4.0, 7.0, 7.0, 6.0, 7.0, 7.0, 13.0, 24.0, 98.0, 220.0, 308.0, 147.0, 40.0, 15.0, 5.0, 6.0, 8.0, 11.0, 3.0, 6.0, 4.0, 5.0, 5.0, 1.0, 7.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1719970703125, -0.1663951873779297, -0.16079330444335938, -0.15519142150878906, -0.14958953857421875, -0.14398765563964844, -0.13838577270507812, -0.1327838897705078, -0.1271820068359375, -0.12158012390136719, -0.11597824096679688, -0.11037635803222656, -0.10477447509765625, -0.09917259216308594, -0.09357070922851562, -0.08796882629394531, -0.082366943359375, -0.07676506042480469, -0.07116317749023438, -0.06556129455566406, -0.05995941162109375, -0.05435752868652344, -0.048755645751953125, -0.04315376281738281, -0.0375518798828125, -0.03194999694824219, -0.026348114013671875, -0.020746231079101562, -0.01514434814453125, -0.009542465209960938, -0.003940582275390625, 0.0016613006591796875, 0.00726318359375, 0.012865066528320312, 0.018466949462890625, 0.024068832397460938, 0.02967071533203125, 0.03527259826660156, 0.040874481201171875, 0.04647636413574219, 0.0520782470703125, 0.05768013000488281, 0.06328201293945312, 0.06888389587402344, 0.07448577880859375, 0.08008766174316406, 0.08568954467773438, 0.09129142761230469, 0.096893310546875, 0.10249519348144531, 0.10809707641601562, 0.11369895935058594, 0.11930084228515625, 0.12490272521972656, 0.13050460815429688, 0.1361064910888672, 0.1417083740234375, 0.1473102569580078, 0.15291213989257812, 0.15851402282714844, 0.16411590576171875, 0.16971778869628906, 0.17531967163085938, 0.1809215545654297, 0.1865234375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 6.0, 22.0, 79.0, 303.0, 936.0, 765302.0, 3426202.0, 988.0, 294.0, 96.0, 28.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4892578125, -0.473968505859375, -0.45867919921875, -0.443389892578125, -0.4281005859375, -0.412811279296875, -0.39752197265625, -0.382232666015625, -0.366943359375, -0.351654052734375, -0.33636474609375, -0.321075439453125, -0.3057861328125, -0.290496826171875, -0.27520751953125, -0.259918212890625, -0.24462890625, -0.229339599609375, -0.21405029296875, -0.198760986328125, -0.1834716796875, -0.168182373046875, -0.15289306640625, -0.137603759765625, -0.122314453125, -0.107025146484375, -0.09173583984375, -0.076446533203125, -0.0611572265625, -0.045867919921875, -0.03057861328125, -0.015289306640625, 0.0, 0.015289306640625, 0.03057861328125, 0.045867919921875, 0.0611572265625, 0.076446533203125, 0.09173583984375, 0.107025146484375, 0.122314453125, 0.137603759765625, 0.15289306640625, 0.168182373046875, 0.1834716796875, 0.198760986328125, 0.21405029296875, 0.229339599609375, 0.24462890625, 0.259918212890625, 0.27520751953125, 0.290496826171875, 0.3057861328125, 0.321075439453125, 0.33636474609375, 0.351654052734375, 0.366943359375, 0.382232666015625, 0.39752197265625, 0.412811279296875, 0.4281005859375, 0.443389892578125, 0.45867919921875, 0.473968505859375, 0.4892578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 13.0, 3904.0, 122.0, 22.0, 8.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.079345703125, -0.07571792602539062, -0.07209014892578125, -0.06846237182617188, -0.0648345947265625, -0.061206817626953125, -0.05757904052734375, -0.053951263427734375, -0.050323486328125, -0.046695709228515625, -0.04306793212890625, -0.039440155029296875, -0.0358123779296875, -0.032184600830078125, -0.02855682373046875, -0.024929046630859375, -0.02130126953125, -0.017673492431640625, -0.01404571533203125, -0.010417938232421875, -0.0067901611328125, -0.003162384033203125, 0.00046539306640625, 0.004093170166015625, 0.007720947265625, 0.011348724365234375, 0.01497650146484375, 0.018604278564453125, 0.0222320556640625, 0.025859832763671875, 0.02948760986328125, 0.033115386962890625, 0.0367431640625, 0.040370941162109375, 0.04399871826171875, 0.047626495361328125, 0.0512542724609375, 0.054882049560546875, 0.05850982666015625, 0.062137603759765625, 0.065765380859375, 0.06939315795898438, 0.07302093505859375, 0.07664871215820312, 0.0802764892578125, 0.08390426635742188, 0.08753204345703125, 0.09115982055664062, 0.09478759765625, 0.09841537475585938, 0.10204315185546875, 0.10567092895507812, 0.1092987060546875, 0.11292648315429688, 0.11655426025390625, 0.12018203735351562, 0.123809814453125, 0.12743759155273438, 0.13106536865234375, 0.13469314575195312, 0.1383209228515625, 0.14194869995117188, 0.14557647705078125, 0.14920425415039062, 0.15283203125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 1011.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.289486825466156, -0.22078987956047058, -0.15209291875362396, -0.08339595794677734, -0.014699012041091919, 0.053997933864593506, 0.12269490957260132, 0.19139185547828674, 0.26008880138397217, 0.3287857472896576, 0.397482693195343, 0.46617966890335083, 0.5348765850067139, 0.6035735607147217, 0.6722705364227295, 0.7409675121307373, 0.8096644282341003, 0.8783614039421082, 0.9470583200454712, 1.015755295753479, 1.0844522714614868, 1.153149127960205, 1.221846103668213, 1.2905430793762207, 1.3592400550842285, 1.4279370307922363, 1.4966340065002441, 1.565330982208252, 1.6340278387069702, 1.702724814414978, 1.7714217901229858, 1.8401187658309937, 1.908815622329712, 1.9775125980377197, 2.0462095737457275, 2.1149065494537354, 2.183603525161743, 2.252300262451172, 2.3209972381591797, 2.3896942138671875, 2.4583911895751953, 2.527088165283203, 2.595785140991211, 2.6644821166992188, 2.7331790924072266, 2.8018760681152344, 2.870573043823242, 2.939269781112671, 3.007966995239258, 3.0766639709472656, 3.1453609466552734, 3.2140579223632812, 3.282754898071289, 3.351451873779297, 3.4201488494873047, 3.4888455867767334, 3.557542562484741, 3.626239538192749, 3.694936513900757, 3.7636334896087646, 3.8323304653167725, 3.901027202606201, 3.969724178314209, 4.038421154022217, 4.107118129730225]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 13.0, 14.0, 24.0, 38.0, 38.0, 56.0, 68.0, 61.0, 82.0, 93.0, 76.0, 79.0, 73.0, 71.0, 57.0, 41.0, 26.0, 25.0, 10.0, 19.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24542725086212158, -0.23944883048534393, -0.23347042500972748, -0.22749200463294983, -0.22151358425617218, -0.21553516387939453, -0.20955675840377808, -0.20357833802700043, -0.19759991765022278, -0.19162149727344513, -0.18564309179782867, -0.17966467142105103, -0.17368625104427338, -0.16770783066749573, -0.16172942519187927, -0.15575100481510162, -0.14977259933948517, -0.14379417896270752, -0.13781577348709106, -0.13183735311031342, -0.12585893273353577, -0.11988051980733871, -0.11390210688114166, -0.10792368650436401, -0.10194527357816696, -0.09596686065196991, -0.08998844027519226, -0.08401002734899521, -0.07803161442279816, -0.07205319404602051, -0.06607478111982346, -0.060096364468336105, -0.054117947816848755, -0.048139531165361404, -0.042161114513874054, -0.036182701587677, -0.03020428493618965, -0.0242258682847023, -0.01824745535850525, -0.012269038707017899, -0.006290622055530548, -0.00031220633536577225, 0.005666209384799004, 0.011644624173641205, 0.017623040825128555, 0.023601457476615906, 0.029579870402812958, 0.03555828705430031, 0.04153670370578766, 0.04751512035727501, 0.05349353700876236, 0.05947194993495941, 0.06545037031173706, 0.07142878323793411, 0.07740719616413116, 0.08338561654090881, 0.08936402946710587, 0.09534244239330292, 0.10132086277008057, 0.10729927569627762, 0.11327768862247467, 0.11925610899925232, 0.12523451447486877, 0.13121293485164642, 0.13719135522842407]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 8.0, 6.0, 4.0, 8.0, 10.0, 9.0, 20.0, 23.0, 29.0, 46.0, 60.0, 108.0, 154.0, 236.0, 360.0, 580.0, 858.0, 1322.0, 1988.0, 3633.0, 6693.0, 15312.0, 81848.0, 880311.0, 31740.0, 10488.0, 5085.0, 2822.0, 1695.0, 1060.0, 666.0, 454.0, 314.0, 192.0, 130.0, 95.0, 41.0, 41.0, 25.0, 13.0, 25.0, 16.0, 5.0, 7.0, 9.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.31982421875, -0.31021881103515625, -0.3006134033203125, -0.29100799560546875, -0.281402587890625, -0.27179718017578125, -0.2621917724609375, -0.25258636474609375, -0.24298095703125, -0.23337554931640625, -0.2237701416015625, -0.21416473388671875, -0.204559326171875, -0.19495391845703125, -0.1853485107421875, -0.17574310302734375, -0.1661376953125, -0.15653228759765625, -0.1469268798828125, -0.13732147216796875, -0.127716064453125, -0.11811065673828125, -0.1085052490234375, -0.09889984130859375, -0.08929443359375, -0.07968902587890625, -0.0700836181640625, -0.06047821044921875, -0.050872802734375, -0.04126739501953125, -0.0316619873046875, -0.02205657958984375, -0.012451171875, -0.00284576416015625, 0.0067596435546875, 0.01636505126953125, 0.025970458984375, 0.03557586669921875, 0.0451812744140625, 0.05478668212890625, 0.06439208984375, 0.07399749755859375, 0.0836029052734375, 0.09320831298828125, 0.102813720703125, 0.11241912841796875, 0.1220245361328125, 0.13162994384765625, 0.1412353515625, 0.15084075927734375, 0.1604461669921875, 0.17005157470703125, 0.179656982421875, 0.18926239013671875, 0.1988677978515625, 0.20847320556640625, 0.21807861328125, 0.22768402099609375, 0.2372894287109375, 0.24689483642578125, 0.256500244140625, 0.26610565185546875, 0.2757110595703125, 0.28531646728515625, 0.294921875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 4.0, 4.0, 6.0, 8.0, 6.0, 7.0, 7.0, 12.0, 24.0, 95.0, 222.0, 304.0, 152.0, 41.0, 14.0, 6.0, 6.0, 8.0, 11.0, 3.0, 6.0, 4.0, 5.0, 5.0, 1.0, 7.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1719970703125, -0.1663970947265625, -0.160797119140625, -0.1551971435546875, -0.14959716796875, -0.1439971923828125, -0.138397216796875, -0.1327972412109375, -0.127197265625, -0.1215972900390625, -0.115997314453125, -0.1103973388671875, -0.10479736328125, -0.0991973876953125, -0.093597412109375, -0.0879974365234375, -0.0823974609375, -0.0767974853515625, -0.071197509765625, -0.0655975341796875, -0.05999755859375, -0.0543975830078125, -0.048797607421875, -0.0431976318359375, -0.03759765625, -0.0319976806640625, -0.026397705078125, -0.0207977294921875, -0.01519775390625, -0.0095977783203125, -0.003997802734375, 0.0016021728515625, 0.0072021484375, 0.0128021240234375, 0.018402099609375, 0.0240020751953125, 0.02960205078125, 0.0352020263671875, 0.040802001953125, 0.0464019775390625, 0.052001953125, 0.0576019287109375, 0.063201904296875, 0.0688018798828125, 0.07440185546875, 0.0800018310546875, 0.085601806640625, 0.0912017822265625, 0.0968017578125, 0.1024017333984375, 0.108001708984375, 0.1136016845703125, 0.11920166015625, 0.1248016357421875, 0.130401611328125, 0.1360015869140625, 0.1416015625, 0.1472015380859375, 0.152801513671875, 0.1584014892578125, 0.16400146484375, 0.1696014404296875, 0.175201416015625, 0.1808013916015625, 0.1864013671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 3.0, 11.0, 10.0, 9.0, 21.0, 19.0, 17.0, 30.0, 32.0, 55.0, 51.0, 79.0, 129.0, 189.0, 293.0, 579.0, 1307.0, 6793.0, 1008275.0, 27093.0, 1737.0, 724.0, 352.0, 204.0, 125.0, 97.0, 68.0, 50.0, 40.0, 28.0, 25.0, 21.0, 19.0, 13.0, 7.0, 7.0, 7.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.69189453125, -0.6693191528320312, -0.6467437744140625, -0.6241683959960938, -0.601593017578125, -0.5790176391601562, -0.5564422607421875, -0.5338668823242188, -0.51129150390625, -0.48871612548828125, -0.4661407470703125, -0.44356536865234375, -0.420989990234375, -0.39841461181640625, -0.3758392333984375, -0.35326385498046875, -0.3306884765625, -0.30811309814453125, -0.2855377197265625, -0.26296234130859375, -0.240386962890625, -0.21781158447265625, -0.1952362060546875, -0.17266082763671875, -0.15008544921875, -0.12751007080078125, -0.1049346923828125, -0.08235931396484375, -0.059783935546875, -0.03720855712890625, -0.0146331787109375, 0.00794219970703125, 0.030517578125, 0.05309295654296875, 0.0756683349609375, 0.09824371337890625, 0.120819091796875, 0.14339447021484375, 0.1659698486328125, 0.18854522705078125, 0.21112060546875, 0.23369598388671875, 0.2562713623046875, 0.27884674072265625, 0.301422119140625, 0.32399749755859375, 0.3465728759765625, 0.36914825439453125, 0.3917236328125, 0.41429901123046875, 0.4368743896484375, 0.45944976806640625, 0.482025146484375, 0.5046005249023438, 0.5271759033203125, 0.5497512817382812, 0.57232666015625, 0.5949020385742188, 0.6174774169921875, 0.6400527954101562, 0.662628173828125, 0.6852035522460938, 0.7077789306640625, 0.7303543090820312, 0.7529296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 3.0, 11.0, 8.0, 8.0, 19.0, 14.0, 14.0, 19.0, 19.0, 30.0, 22.0, 30.0, 41.0, 38.0, 39.0, 45.0, 58.0, 41.0, 44.0, 29.0, 46.0, 36.0, 49.0, 42.0, 35.0, 34.0, 32.0, 28.0, 25.0, 21.0, 20.0, 18.0, 17.0, 12.0, 6.0, 7.0, 7.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4716796875, -0.45629119873046875, -0.4409027099609375, -0.42551422119140625, -0.410125732421875, -0.39473724365234375, -0.3793487548828125, -0.36396026611328125, -0.34857177734375, -0.33318328857421875, -0.3177947998046875, -0.30240631103515625, -0.287017822265625, -0.27162933349609375, -0.2562408447265625, -0.24085235595703125, -0.2254638671875, -0.21007537841796875, -0.1946868896484375, -0.17929840087890625, -0.163909912109375, -0.14852142333984375, -0.1331329345703125, -0.11774444580078125, -0.10235595703125, -0.08696746826171875, -0.0715789794921875, -0.05619049072265625, -0.040802001953125, -0.02541351318359375, -0.0100250244140625, 0.00536346435546875, 0.020751953125, 0.03614044189453125, 0.0515289306640625, 0.06691741943359375, 0.082305908203125, 0.09769439697265625, 0.1130828857421875, 0.12847137451171875, 0.14385986328125, 0.15924835205078125, 0.1746368408203125, 0.19002532958984375, 0.205413818359375, 0.22080230712890625, 0.2361907958984375, 0.25157928466796875, 0.2669677734375, 0.28235626220703125, 0.2977447509765625, 0.31313323974609375, 0.328521728515625, 0.34391021728515625, 0.3592987060546875, 0.37468719482421875, 0.39007568359375, 0.40546417236328125, 0.4208526611328125, 0.43624114990234375, 0.451629638671875, 0.46701812744140625, 0.4824066162109375, 0.49779510498046875, 0.51318359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 7.0, 9.0, 7.0, 9.0, 21.0, 27.0, 53.0, 83.0, 123.0, 235.0, 421.0, 933.0, 1870.0, 5552.0, 23885.0, 796688.0, 196642.0, 14869.0, 4068.0, 1548.0, 678.0, 373.0, 178.0, 99.0, 61.0, 45.0, 19.0, 11.0, 16.0, 11.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023066997528076172, -0.00022364966571331024, -0.00021662935614585876, -0.0002096090465784073, -0.0002025887370109558, -0.00019556842744350433, -0.00018854811787605286, -0.00018152780830860138, -0.0001745074987411499, -0.00016748718917369843, -0.00016046687960624695, -0.00015344657003879547, -0.000146426260471344, -0.00013940595090389252, -0.00013238564133644104, -0.00012536533176898956, -0.00011834502220153809, -0.00011132471263408661, -0.00010430440306663513, -9.728409349918365e-05, -9.026378393173218e-05, -8.32434743642807e-05, -7.622316479682922e-05, -6.920285522937775e-05, -6.218254566192627e-05, -5.516223609447479e-05, -4.8141926527023315e-05, -4.112161695957184e-05, -3.410130739212036e-05, -2.7080997824668884e-05, -2.0060688257217407e-05, -1.304037868976593e-05, -6.020069122314453e-06, 1.000240445137024e-06, 8.020550012588501e-06, 1.5040859580039978e-05, 2.2061169147491455e-05, 2.9081478714942932e-05, 3.610178828239441e-05, 4.3122097849845886e-05, 5.014240741729736e-05, 5.716271698474884e-05, 6.418302655220032e-05, 7.12033361196518e-05, 7.822364568710327e-05, 8.524395525455475e-05, 9.226426482200623e-05, 9.92845743894577e-05, 0.00010630488395690918, 0.00011332519352436066, 0.00012034550309181213, 0.0001273658126592636, 0.0001343861222267151, 0.00014140643179416656, 0.00014842674136161804, 0.00015544705092906952, 0.000162467360496521, 0.00016948767006397247, 0.00017650797963142395, 0.00018352828919887543, 0.0001905485987663269, 0.00019756890833377838, 0.00020458921790122986, 0.00021160952746868134, 0.0002186298370361328]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 8.0, 8.0, 12.0, 10.0, 27.0, 31.0, 33.0, 45.0, 66.0, 87.0, 96.0, 97.0, 112.0, 91.0, 70.0, 59.0, 46.0, 17.0, 19.0, 11.0, 17.0, 8.0, 11.0, 10.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.000301361083984e-06, -8.746981620788574e-06, -8.493661880493164e-06, -8.240342140197754e-06, -7.987022399902344e-06, -7.733702659606934e-06, -7.4803829193115234e-06, -7.227063179016113e-06, -6.973743438720703e-06, -6.720423698425293e-06, -6.467103958129883e-06, -6.213784217834473e-06, -5.9604644775390625e-06, -5.707144737243652e-06, -5.453824996948242e-06, -5.200505256652832e-06, -4.947185516357422e-06, -4.693865776062012e-06, -4.4405460357666016e-06, -4.187226295471191e-06, -3.933906555175781e-06, -3.680586814880371e-06, -3.427267074584961e-06, -3.1739473342895508e-06, -2.9206275939941406e-06, -2.6673078536987305e-06, -2.4139881134033203e-06, -2.16066837310791e-06, -1.9073486328125e-06, -1.6540288925170898e-06, -1.4007091522216797e-06, -1.1473894119262695e-06, -8.940696716308594e-07, -6.407499313354492e-07, -3.8743019104003906e-07, -1.341104507446289e-07, 1.1920928955078125e-07, 3.725290298461914e-07, 6.258487701416016e-07, 8.791685104370117e-07, 1.1324882507324219e-06, 1.385807991027832e-06, 1.6391277313232422e-06, 1.8924474716186523e-06, 2.1457672119140625e-06, 2.3990869522094727e-06, 2.652406692504883e-06, 2.905726432800293e-06, 3.159046173095703e-06, 3.4123659133911133e-06, 3.6656856536865234e-06, 3.919005393981934e-06, 4.172325134277344e-06, 4.425644874572754e-06, 4.678964614868164e-06, 4.932284355163574e-06, 5.185604095458984e-06, 5.4389238357543945e-06, 5.692243576049805e-06, 5.945563316345215e-06, 6.198883056640625e-06, 6.452202796936035e-06, 6.705522537231445e-06, 6.9588422775268555e-06, 7.212162017822266e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 8.0, 6.0, 14.0, 37.0, 61.0, 187.0, 820.0, 1037219.0, 9556.0, 432.0, 111.0, 48.0, 23.0, 14.0, 9.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006570816040039062, -0.0006282925605773926, -0.0005995035171508789, -0.0005707144737243652, -0.0005419254302978516, -0.0005131363868713379, -0.0004843473434448242, -0.00045555830001831055, -0.0004267692565917969, -0.0003979802131652832, -0.00036919116973876953, -0.00034040212631225586, -0.0003116130828857422, -0.0002828240394592285, -0.00025403499603271484, -0.00022524595260620117, -0.0001964569091796875, -0.00016766786575317383, -0.00013887882232666016, -0.00011008977890014648, -8.130073547363281e-05, -5.251169204711914e-05, -2.372264862060547e-05, 5.066394805908203e-06, 3.3855438232421875e-05, 6.264448165893555e-05, 9.143352508544922e-05, 0.00012022256851196289, 0.00014901161193847656, 0.00017780065536499023, 0.0002065896987915039, 0.00023537874221801758, 0.00026416778564453125, 0.0002929568290710449, 0.0003217458724975586, 0.00035053491592407227, 0.00037932395935058594, 0.0004081130027770996, 0.0004369020462036133, 0.00046569108963012695, 0.0004944801330566406, 0.0005232691764831543, 0.000552058219909668, 0.0005808472633361816, 0.0006096363067626953, 0.000638425350189209, 0.0006672143936157227, 0.0006960034370422363, 0.00072479248046875, 0.0007535815238952637, 0.0007823705673217773, 0.000811159610748291, 0.0008399486541748047, 0.0008687376976013184, 0.000897526741027832, 0.0009263157844543457, 0.0009551048278808594, 0.000983893871307373, 0.0010126829147338867, 0.0010414719581604004, 0.001070261001586914, 0.0010990500450134277, 0.0011278390884399414, 0.001156628131866455, 0.0011854171752929688]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 8.0, 22.0, 33.0, 80.0, 146.0, 252.0, 218.0, 125.0, 54.0, 29.0, 15.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044846534729003906, -0.0004288293421268463, -0.00040919333696365356, -0.0003895573318004608, -0.00036992132663726807, -0.0003502853214740753, -0.00033064931631088257, -0.0003110133111476898, -0.00029137730598449707, -0.0002717413008213043, -0.00025210529565811157, -0.00023246929049491882, -0.00021283328533172607, -0.00019319728016853333, -0.00017356127500534058, -0.00015392526984214783, -0.00013428926467895508, -0.00011465325951576233, -9.501725435256958e-05, -7.538124918937683e-05, -5.574524402618408e-05, -3.610923886299133e-05, -1.6473233699798584e-05, 3.162771463394165e-06, 2.2798776626586914e-05, 4.243478178977966e-05, 6.207078695297241e-05, 8.170679211616516e-05, 0.00010134279727935791, 0.00012097880244255066, 0.0001406148076057434, 0.00016025081276893616, 0.0001798868179321289, 0.00019952282309532166, 0.0002191588282585144, 0.00023879483342170715, 0.0002584308385848999, 0.00027806684374809265, 0.0002977028489112854, 0.00031733885407447815, 0.0003369748592376709, 0.00035661086440086365, 0.0003762468695640564, 0.00039588287472724915, 0.0004155188798904419, 0.00043515488505363464, 0.0004547908902168274, 0.00047442689538002014, 0.0004940629005432129, 0.0005136989057064056, 0.0005333349108695984, 0.0005529709160327911, 0.0005726069211959839, 0.0005922429263591766, 0.0006118789315223694, 0.0006315149366855621, 0.0006511509418487549, 0.0006707869470119476, 0.0006904229521751404, 0.0007100589573383331, 0.0007296949625015259, 0.0007493309676647186, 0.0007689669728279114, 0.0007886029779911041, 0.0008082389831542969]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [93.0, 919.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4613819122314453, -0.06981310248374939, 0.32175570726394653, 0.7133245468139648, 1.1048933267593384, 1.496462106704712, 1.888031005859375, 2.279599666595459, 2.671168565750122, 3.062737464904785, 3.454306125640869, 3.8458750247955322, 4.237443923950195, 4.629012584686279, 5.020581245422363, 5.4121503829956055, 5.8037190437316895, 6.195287704467773, 6.586856842041016, 6.9784255027771, 7.369994163513184, 7.761563301086426, 8.153131484985352, 8.544700622558594, 8.936269760131836, 9.327838897705078, 9.719407081604004, 10.110976219177246, 10.502545356750488, 10.894113540649414, 11.285682678222656, 11.677251815795898, 12.068819999694824, 12.460389137268066, 12.851957321166992, 13.243526458740234, 13.635095596313477, 14.026663780212402, 14.418232917785645, 14.80980110168457, 15.201370239257812, 15.592939376831055, 15.98450756072998, 16.376075744628906, 16.76764488220215, 17.15921401977539, 17.550783157348633, 17.942352294921875, 18.333921432495117, 18.72549057006836, 19.1170597076416, 19.508628845214844, 19.900196075439453, 20.291765213012695, 20.683334350585938, 21.07490348815918, 21.46647071838379, 21.85803985595703, 22.249608993530273, 22.641178131103516, 23.032745361328125, 23.424314498901367, 23.81588363647461, 24.20745277404785, 24.599021911621094]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 13.0, 10.0, 11.0, 11.0, 17.0, 21.0, 22.0, 22.0, 27.0, 30.0, 31.0, 28.0, 43.0, 48.0, 38.0, 52.0, 44.0, 54.0, 56.0, 39.0, 36.0, 48.0, 43.0, 33.0, 23.0, 41.0, 34.0, 19.0, 17.0, 11.0, 13.0, 16.0, 5.0, 5.0, 10.0, 5.0, 2.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.792710065841675, -2.708439350128174, -2.624168634414673, -2.539897918701172, -2.45562744140625, -2.371356725692749, -2.287086009979248, -2.202815294265747, -2.118544578552246, -2.034273862838745, -1.9500032663345337, -1.8657325506210327, -1.7814619541168213, -1.6971912384033203, -1.6129205226898193, -1.5286498069763184, -1.4443793296813965, -1.3601086139678955, -1.275838017463684, -1.191567301750183, -1.1072967052459717, -1.0230259895324707, -0.9387552738189697, -0.8544846177101135, -0.7702139616012573, -0.6859433054924011, -0.6016726493835449, -0.517401933670044, -0.43313127756118774, -0.34886062145233154, -0.26458990573883057, -0.18031924962997437, -0.09604883193969727, -0.01177816092967987, 0.07249251008033752, 0.1567631959915161, 0.24103385210037231, 0.3253045082092285, 0.4095752239227295, 0.4938458800315857, 0.5781165361404419, 0.6623871922492981, 0.7466578483581543, 0.8309285640716553, 0.9151992201805115, 0.9994698762893677, 1.0837405920028687, 1.16801118850708, 1.252281904220581, 1.336552619934082, 1.4208232164382935, 1.5050939321517944, 1.5893645286560059, 1.6736352443695068, 1.7579059600830078, 1.8421766757965088, 1.9264472723007202, 2.0107178688049316, 2.0949885845184326, 2.1792593002319336, 2.2635300159454346, 2.3478007316589355, 2.4320712089538574, 2.5163419246673584, 2.6006126403808594]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 6.0, 5.0, 6.0, 9.0, 9.0, 8.0, 23.0, 16.0, 23.0, 29.0, 34.0, 65.0, 675.0, 3261.0, 4140667.0, 47485.0, 1303.0, 354.0, 50.0, 42.0, 32.0, 33.0, 16.0, 19.0, 11.0, 18.0, 11.0, 7.0, 9.0, 8.0, 4.0, 10.0, 4.0, 2.0, 4.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.372314453125, -0.36028289794921875, -0.3482513427734375, -0.33621978759765625, -0.324188232421875, -0.31215667724609375, -0.3001251220703125, -0.28809356689453125, -0.27606201171875, -0.26403045654296875, -0.2519989013671875, -0.23996734619140625, -0.227935791015625, -0.21590423583984375, -0.2038726806640625, -0.19184112548828125, -0.1798095703125, -0.16777801513671875, -0.1557464599609375, -0.14371490478515625, -0.131683349609375, -0.11965179443359375, -0.1076202392578125, -0.09558868408203125, -0.08355712890625, -0.07152557373046875, -0.0594940185546875, -0.04746246337890625, -0.035430908203125, -0.02339935302734375, -0.0113677978515625, 0.00066375732421875, 0.0126953125, 0.02472686767578125, 0.0367584228515625, 0.04878997802734375, 0.060821533203125, 0.07285308837890625, 0.0848846435546875, 0.09691619873046875, 0.10894775390625, 0.12097930908203125, 0.1330108642578125, 0.14504241943359375, 0.157073974609375, 0.16910552978515625, 0.1811370849609375, 0.19316864013671875, 0.2052001953125, 0.21723175048828125, 0.2292633056640625, 0.24129486083984375, 0.253326416015625, 0.26535797119140625, 0.2773895263671875, 0.28942108154296875, 0.30145263671875, 0.31348419189453125, 0.3255157470703125, 0.33754730224609375, 0.349578857421875, 0.36161041259765625, 0.3736419677734375, 0.38567352294921875, 0.397705078125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 5.0, 3.0, 10.0, 7.0, 6.0, 7.0, 11.0, 15.0, 78.0, 187.0, 302.0, 199.0, 54.0, 17.0, 5.0, 7.0, 9.0, 11.0, 3.0, 7.0, 2.0, 6.0, 6.0, 0.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1715087890625, -0.16596603393554688, -0.16042327880859375, -0.15488052368164062, -0.1493377685546875, -0.14379501342773438, -0.13825225830078125, -0.13270950317382812, -0.127166748046875, -0.12162399291992188, -0.11608123779296875, -0.11053848266601562, -0.1049957275390625, -0.09945297241210938, -0.09391021728515625, -0.08836746215820312, -0.08282470703125, -0.07728195190429688, -0.07173919677734375, -0.06619644165039062, -0.0606536865234375, -0.055110931396484375, -0.04956817626953125, -0.044025421142578125, -0.038482666015625, -0.032939910888671875, -0.02739715576171875, -0.021854400634765625, -0.0163116455078125, -0.010768890380859375, -0.00522613525390625, 0.000316619873046875, 0.005859375, 0.011402130126953125, 0.01694488525390625, 0.022487640380859375, 0.0280303955078125, 0.033573150634765625, 0.03911590576171875, 0.044658660888671875, 0.050201416015625, 0.055744171142578125, 0.06128692626953125, 0.06682968139648438, 0.0723724365234375, 0.07791519165039062, 0.08345794677734375, 0.08900070190429688, 0.09454345703125, 0.10008621215820312, 0.10562896728515625, 0.11117172241210938, 0.1167144775390625, 0.12225723266601562, 0.12779998779296875, 0.13334274291992188, 0.138885498046875, 0.14442825317382812, 0.14997100830078125, 0.15551376342773438, 0.1610565185546875, 0.16659927368164062, 0.17214202880859375, 0.17768478393554688, 0.1832275390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 0.0, 1.0, 3.0, 3.0, 3.0, 9.0, 17.0, 70.0, 208.0, 516.0, 1681.0, 19832.0, 4168042.0, 2709.0, 760.0, 277.0, 79.0, 26.0, 14.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.329833984375, -0.32045745849609375, -0.3110809326171875, -0.30170440673828125, -0.292327880859375, -0.28295135498046875, -0.2735748291015625, -0.26419830322265625, -0.25482177734375, -0.24544525146484375, -0.2360687255859375, -0.22669219970703125, -0.217315673828125, -0.20793914794921875, -0.1985626220703125, -0.18918609619140625, -0.1798095703125, -0.17043304443359375, -0.1610565185546875, -0.15167999267578125, -0.142303466796875, -0.13292694091796875, -0.1235504150390625, -0.11417388916015625, -0.10479736328125, -0.09542083740234375, -0.0860443115234375, -0.07666778564453125, -0.067291259765625, -0.05791473388671875, -0.0485382080078125, -0.03916168212890625, -0.02978515625, -0.02040863037109375, -0.0110321044921875, -0.00165557861328125, 0.007720947265625, 0.01709747314453125, 0.0264739990234375, 0.03585052490234375, 0.04522705078125, 0.05460357666015625, 0.0639801025390625, 0.07335662841796875, 0.082733154296875, 0.09210968017578125, 0.1014862060546875, 0.11086273193359375, 0.1202392578125, 0.12961578369140625, 0.1389923095703125, 0.14836883544921875, 0.157745361328125, 0.16712188720703125, 0.1764984130859375, 0.18587493896484375, 0.19525146484375, 0.20462799072265625, 0.2140045166015625, 0.22338104248046875, 0.232757568359375, 0.24213409423828125, 0.2515106201171875, 0.26088714599609375, 0.270263671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 9.0, 16.0, 39.0, 3805.0, 153.0, 28.0, 10.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0980224609375, -0.09462356567382812, -0.09122467041015625, -0.08782577514648438, -0.0844268798828125, -0.08102798461914062, -0.07762908935546875, -0.07423019409179688, -0.070831298828125, -0.06743240356445312, -0.06403350830078125, -0.060634613037109375, -0.0572357177734375, -0.053836822509765625, -0.05043792724609375, -0.047039031982421875, -0.04364013671875, -0.040241241455078125, -0.03684234619140625, -0.033443450927734375, -0.0300445556640625, -0.026645660400390625, -0.02324676513671875, -0.019847869873046875, -0.016448974609375, -0.013050079345703125, -0.00965118408203125, -0.006252288818359375, -0.0028533935546875, 0.000545501708984375, 0.00394439697265625, 0.007343292236328125, 0.0107421875, 0.014141082763671875, 0.01753997802734375, 0.020938873291015625, 0.0243377685546875, 0.027736663818359375, 0.03113555908203125, 0.034534454345703125, 0.037933349609375, 0.041332244873046875, 0.04473114013671875, 0.048130035400390625, 0.0515289306640625, 0.054927825927734375, 0.05832672119140625, 0.061725616455078125, 0.06512451171875, 0.06852340698242188, 0.07192230224609375, 0.07532119750976562, 0.0787200927734375, 0.08211898803710938, 0.08551788330078125, 0.08891677856445312, 0.092315673828125, 0.09571456909179688, 0.09911346435546875, 0.10251235961914062, 0.1059112548828125, 0.10931015014648438, 0.11270904541015625, 0.11610794067382812, 0.1195068359375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 228.0, 785.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20907212793827057, -0.18825598061084747, -0.16743981838226318, -0.1466236710548401, -0.125807523727417, -0.1049913763999939, -0.0841752216219902, -0.06335906684398651, -0.042542919516563416, -0.02172676846385002, -0.0009106174111366272, 0.019905533641576767, 0.04072168469429016, 0.06153783202171326, 0.08235398679971695, 0.10317014157772064, 0.12398628890514374, 0.14480243623256683, 0.16561859846115112, 0.18643474578857422, 0.20725089311599731, 0.2280670404434204, 0.2488831877708435, 0.2696993350982666, 0.2905154824256897, 0.3113316297531128, 0.3321477770805359, 0.352963924407959, 0.3737800717353821, 0.3945962190628052, 0.41541239619255066, 0.43622854351997375, 0.45704472064971924, 0.47786086797714233, 0.49867701530456543, 0.5194931626319885, 0.5403093099594116, 0.5611254572868347, 0.5819416046142578, 0.6027578115463257, 0.623573899269104, 0.6443900465965271, 0.6652061939239502, 0.6860223412513733, 0.7068384885787964, 0.7276546359062195, 0.7484707832336426, 0.7692869901657104, 0.7901031374931335, 0.8109192848205566, 0.8317354321479797, 0.8525515794754028, 0.8733677268028259, 0.894183874130249, 0.9150000214576721, 0.9358161687850952, 0.9566323757171631, 0.9774485230445862, 0.9982646703720093, 1.0190808773040771, 1.0398969650268555, 1.0607131719589233, 1.0815292596817017, 1.1023454666137695, 1.1231615543365479]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 11.0, 9.0, 19.0, 21.0, 33.0, 32.0, 45.0, 50.0, 55.0, 64.0, 64.0, 72.0, 82.0, 72.0, 61.0, 65.0, 52.0, 45.0, 36.0, 34.0, 23.0, 16.0, 15.0, 6.0, 8.0, 8.0, 8.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1929013729095459, -0.18761718273162842, -0.18233300745487213, -0.17704881727695465, -0.17176462709903717, -0.16648045182228088, -0.1611962616443634, -0.15591207146644592, -0.15062788128852844, -0.14534369111061096, -0.14005951583385468, -0.1347753256559372, -0.12949113547801971, -0.12420695275068283, -0.11892277002334595, -0.11363857984542847, -0.10835440456867218, -0.1030702218413353, -0.09778603166341782, -0.09250184893608093, -0.08721765875816345, -0.08193347603082657, -0.07664929330348969, -0.0713651031255722, -0.06608092039823532, -0.06079673394560814, -0.05551254749298096, -0.050228364765644073, -0.04494417831301689, -0.03965999186038971, -0.034375809133052826, -0.029091622680425644, -0.023807436227798462, -0.01852324977517128, -0.013239065185189247, -0.007954880595207214, -0.0026706941425800323, 0.0026134923100471497, 0.007897675037384033, 0.013181861490011215, 0.018466047942638397, 0.02375023439526558, 0.029034418985247612, 0.034318603575229645, 0.03960279002785683, 0.04488697648048401, 0.05017115920782089, 0.055455345660448074, 0.060739532113075256, 0.06602371484041214, 0.07130790501832962, 0.0765920877456665, 0.08187627792358398, 0.08716046065092087, 0.09244464337825775, 0.09772883355617523, 0.10301301628351212, 0.108297199010849, 0.11358138918876648, 0.11886557191610336, 0.12414975464344025, 0.12943394482135773, 0.134718120098114, 0.1400023102760315, 0.14528650045394897]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 12.0, 3.0, 4.0, 12.0, 9.0, 11.0, 11.0, 29.0, 19.0, 29.0, 24.0, 65.0, 62.0, 124.0, 173.0, 293.0, 474.0, 871.0, 1447.0, 2742.0, 6115.0, 16192.0, 207158.0, 781078.0, 18597.0, 6257.0, 2783.0, 1488.0, 901.0, 533.0, 352.0, 250.0, 108.0, 99.0, 50.0, 43.0, 26.0, 28.0, 14.0, 16.0, 12.0, 14.0, 11.0, 6.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.25927734375, -0.2514362335205078, -0.24359512329101562, -0.23575401306152344, -0.22791290283203125, -0.22007179260253906, -0.21223068237304688, -0.2043895721435547, -0.1965484619140625, -0.1887073516845703, -0.18086624145507812, -0.17302513122558594, -0.16518402099609375, -0.15734291076660156, -0.14950180053710938, -0.1416606903076172, -0.133819580078125, -0.1259784698486328, -0.11813735961914062, -0.11029624938964844, -0.10245513916015625, -0.09461402893066406, -0.08677291870117188, -0.07893180847167969, -0.0710906982421875, -0.06324958801269531, -0.055408477783203125, -0.04756736755371094, -0.03972625732421875, -0.03188514709472656, -0.024044036865234375, -0.016202926635742188, -0.00836181640625, -0.0005207061767578125, 0.007320404052734375, 0.015161514282226562, 0.02300262451171875, 0.030843734741210938, 0.038684844970703125, 0.04652595520019531, 0.0543670654296875, 0.06220817565917969, 0.07004928588867188, 0.07789039611816406, 0.08573150634765625, 0.09357261657714844, 0.10141372680664062, 0.10925483703613281, 0.117095947265625, 0.12493705749511719, 0.13277816772460938, 0.14061927795410156, 0.14846038818359375, 0.15630149841308594, 0.16414260864257812, 0.1719837188720703, 0.1798248291015625, 0.1876659393310547, 0.19550704956054688, 0.20334815979003906, 0.21118927001953125, 0.21903038024902344, 0.22687149047851562, 0.2347126007080078, 0.2425537109375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 5.0, 3.0, 11.0, 6.0, 6.0, 7.0, 11.0, 15.0, 77.0, 188.0, 302.0, 199.0, 54.0, 17.0, 5.0, 7.0, 9.0, 11.0, 3.0, 6.0, 3.0, 6.0, 6.0, 0.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.17138671875, -0.1658477783203125, -0.160308837890625, -0.1547698974609375, -0.14923095703125, -0.1436920166015625, -0.138153076171875, -0.1326141357421875, -0.1270751953125, -0.1215362548828125, -0.115997314453125, -0.1104583740234375, -0.10491943359375, -0.0993804931640625, -0.093841552734375, -0.0883026123046875, -0.082763671875, -0.0772247314453125, -0.071685791015625, -0.0661468505859375, -0.06060791015625, -0.0550689697265625, -0.049530029296875, -0.0439910888671875, -0.0384521484375, -0.0329132080078125, -0.027374267578125, -0.0218353271484375, -0.01629638671875, -0.0107574462890625, -0.005218505859375, 0.0003204345703125, 0.005859375, 0.0113983154296875, 0.016937255859375, 0.0224761962890625, 0.02801513671875, 0.0335540771484375, 0.039093017578125, 0.0446319580078125, 0.0501708984375, 0.0557098388671875, 0.061248779296875, 0.0667877197265625, 0.07232666015625, 0.0778656005859375, 0.083404541015625, 0.0889434814453125, 0.094482421875, 0.1000213623046875, 0.105560302734375, 0.1110992431640625, 0.11663818359375, 0.1221771240234375, 0.127716064453125, 0.1332550048828125, 0.1387939453125, 0.1443328857421875, 0.149871826171875, 0.1554107666015625, 0.16094970703125, 0.1664886474609375, 0.172027587890625, 0.1775665283203125, 0.18310546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 3.0, 2.0, 5.0, 4.0, 7.0, 2.0, 2.0, 10.0, 11.0, 12.0, 20.0, 16.0, 21.0, 25.0, 29.0, 32.0, 54.0, 86.0, 92.0, 151.0, 286.0, 770.0, 2711.0, 835413.0, 205282.0, 2103.0, 589.0, 273.0, 144.0, 95.0, 81.0, 31.0, 27.0, 31.0, 30.0, 16.0, 19.0, 17.0, 14.0, 13.0, 11.0, 2.0, 3.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55712890625, -0.5396804809570312, -0.5222320556640625, -0.5047836303710938, -0.487335205078125, -0.46988677978515625, -0.4524383544921875, -0.43498992919921875, -0.41754150390625, -0.40009307861328125, -0.3826446533203125, -0.36519622802734375, -0.347747802734375, -0.33029937744140625, -0.3128509521484375, -0.29540252685546875, -0.2779541015625, -0.26050567626953125, -0.2430572509765625, -0.22560882568359375, -0.208160400390625, -0.19071197509765625, -0.1732635498046875, -0.15581512451171875, -0.13836669921875, -0.12091827392578125, -0.1034698486328125, -0.08602142333984375, -0.068572998046875, -0.05112457275390625, -0.0336761474609375, -0.01622772216796875, 0.001220703125, 0.01866912841796875, 0.0361175537109375, 0.05356597900390625, 0.071014404296875, 0.08846282958984375, 0.1059112548828125, 0.12335968017578125, 0.14080810546875, 0.15825653076171875, 0.1757049560546875, 0.19315338134765625, 0.210601806640625, 0.22805023193359375, 0.2454986572265625, 0.26294708251953125, 0.2803955078125, 0.29784393310546875, 0.3152923583984375, 0.33274078369140625, 0.350189208984375, 0.36763763427734375, 0.3850860595703125, 0.40253448486328125, 0.41998291015625, 0.43743133544921875, 0.4548797607421875, 0.47232818603515625, 0.489776611328125, 0.5072250366210938, 0.5246734619140625, 0.5421218872070312, 0.5595703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 3.0, 2.0, 5.0, 4.0, 7.0, 2.0, 2.0, 10.0, 11.0, 11.0, 20.0, 16.0, 17.0, 25.0, 22.0, 22.0, 36.0, 41.0, 34.0, 40.0, 43.0, 55.0, 44.0, 41.0, 53.0, 37.0, 33.0, 54.0, 46.0, 42.0, 45.0, 20.0, 16.0, 23.0, 22.0, 14.0, 17.0, 15.0, 14.0, 13.0, 11.0, 2.0, 3.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.493408203125, -0.4779548645019531, -0.46250152587890625, -0.4470481872558594, -0.4315948486328125, -0.4161415100097656, -0.40068817138671875, -0.3852348327636719, -0.369781494140625, -0.3543281555175781, -0.33887481689453125, -0.3234214782714844, -0.3079681396484375, -0.2925148010253906, -0.27706146240234375, -0.2616081237792969, -0.24615478515625, -0.23070144653320312, -0.21524810791015625, -0.19979476928710938, -0.1843414306640625, -0.16888809204101562, -0.15343475341796875, -0.13798141479492188, -0.122528076171875, -0.10707473754882812, -0.09162139892578125, -0.07616806030273438, -0.0607147216796875, -0.045261383056640625, -0.02980804443359375, -0.014354705810546875, 0.0010986328125, 0.016551971435546875, 0.03200531005859375, 0.047458648681640625, 0.0629119873046875, 0.07836532592773438, 0.09381866455078125, 0.10927200317382812, 0.124725341796875, 0.14017868041992188, 0.15563201904296875, 0.17108535766601562, 0.1865386962890625, 0.20199203491210938, 0.21744537353515625, 0.23289871215820312, 0.24835205078125, 0.2638053894042969, 0.27925872802734375, 0.2947120666503906, 0.3101654052734375, 0.3256187438964844, 0.34107208251953125, 0.3565254211425781, 0.371978759765625, 0.3874320983886719, 0.40288543701171875, 0.4183387756347656, 0.4337921142578125, 0.4492454528808594, 0.46469879150390625, 0.4801521301269531, 0.49560546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 10.0, 18.0, 27.0, 27.0, 53.0, 97.0, 188.0, 347.0, 710.0, 2096.0, 11548.0, 703009.0, 316938.0, 10090.0, 1996.0, 697.0, 310.0, 131.0, 91.0, 65.0, 35.0, 17.0, 17.0, 4.0, 9.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002048015594482422, -0.00019773095846176147, -0.00019066035747528076, -0.00018358975648880005, -0.00017651915550231934, -0.00016944855451583862, -0.0001623779535293579, -0.0001553073525428772, -0.00014823675155639648, -0.00014116615056991577, -0.00013409554958343506, -0.00012702494859695435, -0.00011995434761047363, -0.00011288374662399292, -0.00010581314563751221, -9.87425446510315e-05, -9.167194366455078e-05, -8.460134267807007e-05, -7.753074169158936e-05, -7.046014070510864e-05, -6.338953971862793e-05, -5.631893873214722e-05, -4.9248337745666504e-05, -4.217773675918579e-05, -3.510713577270508e-05, -2.8036534786224365e-05, -2.0965933799743652e-05, -1.389533281326294e-05, -6.8247318267822266e-06, 2.4586915969848633e-07, 7.316470146179199e-06, 1.4387071132659912e-05, 2.1457672119140625e-05, 2.8528273105621338e-05, 3.559887409210205e-05, 4.2669475078582764e-05, 4.9740076065063477e-05, 5.681067705154419e-05, 6.38812780380249e-05, 7.095187902450562e-05, 7.802248001098633e-05, 8.509308099746704e-05, 9.216368198394775e-05, 9.923428297042847e-05, 0.00010630488395690918, 0.00011337548494338989, 0.0001204460859298706, 0.00012751668691635132, 0.00013458728790283203, 0.00014165788888931274, 0.00014872848987579346, 0.00015579909086227417, 0.00016286969184875488, 0.0001699402928352356, 0.0001770108938217163, 0.00018408149480819702, 0.00019115209579467773, 0.00019822269678115845, 0.00020529329776763916, 0.00021236389875411987, 0.00021943449974060059, 0.0002265051007270813, 0.000233575701713562, 0.00024064630270004272, 0.00024771690368652344]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 6.0, 6.0, 10.0, 17.0, 7.0, 21.0, 11.0, 28.0, 53.0, 43.0, 35.0, 51.0, 42.0, 84.0, 58.0, 61.0, 52.0, 48.0, 51.0, 70.0, 22.0, 38.0, 30.0, 27.0, 19.0, 20.0, 14.0, 11.0, 9.0, 7.0, 11.0, 11.0, 8.0, 4.0, 3.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.76837158203125e-06, -4.6389177441596985e-06, -4.509463906288147e-06, -4.3800100684165955e-06, -4.250556230545044e-06, -4.1211023926734924e-06, -3.991648554801941e-06, -3.862194716930389e-06, -3.732740879058838e-06, -3.6032870411872864e-06, -3.473833203315735e-06, -3.3443793654441833e-06, -3.214925527572632e-06, -3.0854716897010803e-06, -2.956017851829529e-06, -2.8265640139579773e-06, -2.6971101760864258e-06, -2.5676563382148743e-06, -2.4382025003433228e-06, -2.3087486624717712e-06, -2.1792948246002197e-06, -2.0498409867286682e-06, -1.9203871488571167e-06, -1.7909333109855652e-06, -1.6614794731140137e-06, -1.5320256352424622e-06, -1.4025717973709106e-06, -1.2731179594993591e-06, -1.1436641216278076e-06, -1.014210283756256e-06, -8.847564458847046e-07, -7.553026080131531e-07, -6.258487701416016e-07, -4.9639493227005e-07, -3.6694109439849854e-07, -2.3748725652694702e-07, -1.0803341865539551e-07, 2.1420419216156006e-08, 1.5087425708770752e-07, 2.8032809495925903e-07, 4.0978193283081055e-07, 5.392357707023621e-07, 6.686896085739136e-07, 7.981434464454651e-07, 9.275972843170166e-07, 1.0570511221885681e-06, 1.1865049600601196e-06, 1.3159587979316711e-06, 1.4454126358032227e-06, 1.5748664736747742e-06, 1.7043203115463257e-06, 1.8337741494178772e-06, 1.9632279872894287e-06, 2.0926818251609802e-06, 2.2221356630325317e-06, 2.3515895009040833e-06, 2.4810433387756348e-06, 2.6104971766471863e-06, 2.739951014518738e-06, 2.8694048523902893e-06, 2.998858690261841e-06, 3.1283125281333923e-06, 3.257766366004944e-06, 3.3872202038764954e-06, 3.516674041748047e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 3.0, 3.0, 3.0, 5.0, 4.0, 9.0, 5.0, 14.0, 27.0, 37.0, 56.0, 109.0, 186.0, 502.0, 4629.0, 1038175.0, 3866.0, 475.0, 168.0, 88.0, 61.0, 34.0, 29.0, 26.0, 11.0, 7.0, 5.0, 7.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003333091735839844, -0.0003223717212677002, -0.000311434268951416, -0.00030049681663513184, -0.00028955936431884766, -0.0002786219120025635, -0.0002676844596862793, -0.0002567470073699951, -0.00024580955505371094, -0.00023487210273742676, -0.00022393465042114258, -0.0002129971981048584, -0.00020205974578857422, -0.00019112229347229004, -0.00018018484115600586, -0.00016924738883972168, -0.0001583099365234375, -0.00014737248420715332, -0.00013643503189086914, -0.00012549757957458496, -0.00011456012725830078, -0.0001036226749420166, -9.268522262573242e-05, -8.174777030944824e-05, -7.081031799316406e-05, -5.987286567687988e-05, -4.89354133605957e-05, -3.7997961044311523e-05, -2.7060508728027344e-05, -1.6123056411743164e-05, -5.185604095458984e-06, 5.751848220825195e-06, 1.6689300537109375e-05, 2.7626752853393555e-05, 3.8564205169677734e-05, 4.9501657485961914e-05, 6.0439109802246094e-05, 7.137656211853027e-05, 8.231401443481445e-05, 9.325146675109863e-05, 0.00010418891906738281, 0.00011512637138366699, 0.00012606382369995117, 0.00013700127601623535, 0.00014793872833251953, 0.0001588761806488037, 0.0001698136329650879, 0.00018075108528137207, 0.00019168853759765625, 0.00020262598991394043, 0.0002135634422302246, 0.0002245008945465088, 0.00023543834686279297, 0.00024637579917907715, 0.00025731325149536133, 0.0002682507038116455, 0.0002791881561279297, 0.00029012560844421387, 0.00030106306076049805, 0.0003120005130767822, 0.0003229379653930664, 0.0003338754177093506, 0.00034481287002563477, 0.00035575032234191895, 0.0003666877746582031]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 2.0, 3.0, 4.0, 3.0, 9.0, 2.0, 12.0, 18.0, 29.0, 41.0, 52.0, 60.0, 90.0, 112.0, 133.0, 98.0, 85.0, 58.0, 48.0, 43.0, 23.0, 21.0, 19.0, 11.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002956390380859375, -0.0002859383821487427, -0.00027623772621154785, -0.00026653707027435303, -0.0002568364143371582, -0.0002471357583999634, -0.00023743510246276855, -0.00022773444652557373, -0.0002180337905883789, -0.00020833313465118408, -0.00019863247871398926, -0.00018893182277679443, -0.0001792311668395996, -0.00016953051090240479, -0.00015982985496520996, -0.00015012919902801514, -0.0001404285430908203, -0.0001307278871536255, -0.00012102723121643066, -0.00011132657527923584, -0.00010162591934204102, -9.192526340484619e-05, -8.222460746765137e-05, -7.252395153045654e-05, -6.282329559326172e-05, -5.3122639656066895e-05, -4.342198371887207e-05, -3.3721327781677246e-05, -2.4020671844482422e-05, -1.4320015907287598e-05, -4.6193599700927734e-06, 5.081295967102051e-06, 1.4781951904296875e-05, 2.44826078414917e-05, 3.4183263778686523e-05, 4.388391971588135e-05, 5.358457565307617e-05, 6.3285231590271e-05, 7.298588752746582e-05, 8.268654346466064e-05, 9.238719940185547e-05, 0.00010208785533905029, 0.00011178851127624512, 0.00012148916721343994, 0.00013118982315063477, 0.0001408904790878296, 0.00015059113502502441, 0.00016029179096221924, 0.00016999244689941406, 0.0001796931028366089, 0.0001893937587738037, 0.00019909441471099854, 0.00020879507064819336, 0.00021849572658538818, 0.000228196382522583, 0.00023789703845977783, 0.00024759769439697266, 0.0002572983503341675, 0.0002669990062713623, 0.00027669966220855713, 0.00028640031814575195, 0.0002961009740829468, 0.0003058016300201416, 0.0003155022859573364, 0.00032520294189453125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 124.0, 866.0, 22.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.83314323425293, -10.640776634216309, -10.448410034179688, -10.256043434143066, -10.063676834106445, -9.871310234069824, -9.678943634033203, -9.486577033996582, -9.294210433959961, -9.10184383392334, -8.909477233886719, -8.717110633850098, -8.524744033813477, -8.332377433776855, -8.140010833740234, -7.947644233703613, -7.755277156829834, -7.562910556793213, -7.370543956756592, -7.178177356719971, -6.98581075668335, -6.7934441566467285, -6.601077079772949, -6.408710479736328, -6.216343879699707, -6.023977279663086, -5.831610679626465, -5.639244079589844, -5.446877479553223, -5.254510879516602, -5.0621442794799805, -4.869777679443359, -4.6774115562438965, -4.485044956207275, -4.292678356170654, -4.100311756134033, -3.907945156097412, -3.715578556060791, -3.523211717605591, -3.3308451175689697, -3.1384785175323486, -2.9461119174957275, -2.7537453174591064, -2.5613784790039062, -2.369011878967285, -2.176645278930664, -1.984278678894043, -1.7919120788574219, -1.5995454788208008, -1.4071788787841797, -1.2148122787475586, -1.022445559501648, -0.8300789594650269, -0.6377123594284058, -0.4453456401824951, -0.252979040145874, -0.06061244010925293, 0.13175418972969055, 0.32412081956863403, 0.5164874792098999, 0.708854079246521, 0.9012206792831421, 1.0935873985290527, 1.2859539985656738, 1.478320598602295]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 11.0, 11.0, 10.0, 22.0, 15.0, 16.0, 24.0, 30.0, 33.0, 36.0, 43.0, 33.0, 37.0, 49.0, 54.0, 57.0, 54.0, 52.0, 53.0, 57.0, 29.0, 36.0, 46.0, 26.0, 31.0, 21.0, 15.0, 25.0, 20.0, 15.0, 7.0, 6.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.3956475257873535, -3.3011348247528076, -3.206622362136841, -3.112109661102295, -3.017596960067749, -2.9230844974517822, -2.8285717964172363, -2.7340593338012695, -2.6395466327667236, -2.5450339317321777, -2.450521469116211, -2.356008768081665, -2.261496067047119, -2.1669836044311523, -2.0724709033966064, -1.97795832157135, -1.8834456205368042, -1.7889330387115479, -1.694420337677002, -1.5999077558517456, -1.5053951740264893, -1.4108824729919434, -1.316369891166687, -1.2218573093414307, -1.1273446083068848, -1.0328320264816284, -0.9383193850517273, -0.8438067436218262, -0.7492941617965698, -0.6547815203666687, -0.5602688789367676, -0.46575629711151123, -0.3712437152862549, -0.27673110365867615, -0.18221847712993622, -0.08770585060119629, 0.006806761026382446, 0.10131937265396118, 0.1958320140838623, 0.29034459590911865, 0.3848572373390198, 0.4793698489665985, 0.5738824605941772, 0.6683951020240784, 0.7629077434539795, 0.8574203252792358, 0.951932966709137, 1.046445608139038, 1.1409581899642944, 1.2354707717895508, 1.3299834728240967, 1.424496054649353, 1.5190086364746094, 1.6135213375091553, 1.7080339193344116, 1.802546501159668, 1.8970592021942139, 1.9915717840194702, 2.0860843658447266, 2.1805970668792725, 2.2751097679138184, 2.369622230529785, 2.464134931564331, 2.558647632598877, 2.6531600952148438]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 2.0, 3.0, 3.0, 7.0, 5.0, 3.0, 12.0, 8.0, 8.0, 7.0, 21.0, 71.0, 4193491.0, 291.0, 179.0, 62.0, 17.0, 9.0, 6.0, 6.0, 6.0, 11.0, 4.0, 3.0, 9.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0026302337646484375, -0.0025503933429718018, -0.002470552921295166, -0.0023907124996185303, -0.0023108720779418945, -0.002231031656265259, -0.002151191234588623, -0.0020713508129119873, -0.0019915103912353516, -0.0019116699695587158, -0.00183182954788208, -0.0017519891262054443, -0.0016721487045288086, -0.0015923082828521729, -0.0015124678611755371, -0.0014326274394989014, -0.0013527870178222656, -0.0012729465961456299, -0.0011931061744689941, -0.0011132657527923584, -0.0010334253311157227, -0.0009535849094390869, -0.0008737444877624512, -0.0007939040660858154, -0.0007140636444091797, -0.0006342232227325439, -0.0005543828010559082, -0.00047454237937927246, -0.0003947019577026367, -0.000314861536026001, -0.00023502111434936523, -0.0001551806926727295, -7.534027099609375e-05, 4.500150680541992e-06, 8.434057235717773e-05, 0.00016418099403381348, 0.00024402141571044922, 0.00032386183738708496, 0.0004037022590637207, 0.00048354268074035645, 0.0005633831024169922, 0.0006432235240936279, 0.0007230639457702637, 0.0008029043674468994, 0.0008827447891235352, 0.0009625852108001709, 0.0010424256324768066, 0.0011222660541534424, 0.0012021064758300781, 0.0012819468975067139, 0.0013617873191833496, 0.0014416277408599854, 0.001521468162536621, 0.0016013085842132568, 0.0016811490058898926, 0.0017609894275665283, 0.001840829849243164, 0.0019206702709197998, 0.0020005106925964355, 0.0020803511142730713, 0.002160191535949707, 0.0022400319576263428, 0.0023198723793029785, 0.0023997128009796143, 0.00247955322265625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 3.0, 10.0, 8.0, 6.0, 6.0, 9.0, 14.0, 51.0, 159.0, 277.0, 231.0, 98.0, 22.0, 8.0, 6.0, 7.0, 13.0, 4.0, 6.0, 4.0, 5.0, 3.0, 4.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.171875, -0.16637039184570312, -0.16086578369140625, -0.15536117553710938, -0.1498565673828125, -0.14435195922851562, -0.13884735107421875, -0.13334274291992188, -0.127838134765625, -0.12233352661132812, -0.11682891845703125, -0.11132431030273438, -0.1058197021484375, -0.10031509399414062, -0.09481048583984375, -0.08930587768554688, -0.08380126953125, -0.07829666137695312, -0.07279205322265625, -0.06728744506835938, -0.0617828369140625, -0.056278228759765625, -0.05077362060546875, -0.045269012451171875, -0.039764404296875, -0.034259796142578125, -0.02875518798828125, -0.023250579833984375, -0.0177459716796875, -0.012241363525390625, -0.00673675537109375, -0.001232147216796875, 0.0042724609375, 0.009777069091796875, 0.01528167724609375, 0.020786285400390625, 0.0262908935546875, 0.031795501708984375, 0.03730010986328125, 0.042804718017578125, 0.048309326171875, 0.053813934326171875, 0.05931854248046875, 0.06482315063476562, 0.0703277587890625, 0.07583236694335938, 0.08133697509765625, 0.08684158325195312, 0.09234619140625, 0.09785079956054688, 0.10335540771484375, 0.10886001586914062, 0.1143646240234375, 0.11986923217773438, 0.12537384033203125, 0.13087844848632812, 0.136383056640625, 0.14188766479492188, 0.14739227294921875, 0.15289688110351562, 0.1584014892578125, 0.16390609741210938, 0.16941070556640625, 0.17491531372070312, 0.180419921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 14.0, 18.0, 31.0, 52.0, 86.0, 85.0, 96.0, 80.0, 4193377.0, 96.0, 103.0, 92.0, 73.0, 37.0, 35.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013427734375, -0.013033509254455566, -0.012639284133911133, -0.0122450590133667, -0.011850833892822266, -0.011456608772277832, -0.011062383651733398, -0.010668158531188965, -0.010273933410644531, -0.009879708290100098, -0.009485483169555664, -0.00909125804901123, -0.008697032928466797, -0.008302807807922363, -0.00790858268737793, -0.007514357566833496, -0.0071201324462890625, -0.006725907325744629, -0.006331682205200195, -0.005937457084655762, -0.005543231964111328, -0.0051490068435668945, -0.004754781723022461, -0.004360556602478027, -0.003966331481933594, -0.00357210636138916, -0.0031778812408447266, -0.002783656120300293, -0.0023894309997558594, -0.0019952058792114258, -0.0016009807586669922, -0.0012067556381225586, -0.000812530517578125, -0.0004183053970336914, -2.4080276489257812e-05, 0.0003701448440551758, 0.0007643699645996094, 0.001158595085144043, 0.0015528202056884766, 0.0019470453262329102, 0.0023412704467773438, 0.0027354955673217773, 0.003129720687866211, 0.0035239458084106445, 0.003918170928955078, 0.004312396049499512, 0.004706621170043945, 0.005100846290588379, 0.0054950714111328125, 0.005889296531677246, 0.00628352165222168, 0.006677746772766113, 0.007071971893310547, 0.0074661970138549805, 0.007860422134399414, 0.008254647254943848, 0.008648872375488281, 0.009043097496032715, 0.009437322616577148, 0.009831547737121582, 0.010225772857666016, 0.01061999797821045, 0.011014223098754883, 0.011408448219299316, 0.01180267333984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4095.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 6.139278411865234e-05, 0.0001227855682373047, 0.00018417835235595703, 0.0002455711364746094, 0.0003069639205932617, 0.00036835670471191406, 0.0004297494888305664, 0.0004911422729492188, 0.0005525350570678711, 0.0006139278411865234, 0.0006753206253051758, 0.0007367134094238281, 0.0007981061935424805, 0.0008594989776611328, 0.0009208917617797852, 0.0009822845458984375, 0.0010436773300170898, 0.0011050701141357422, 0.0011664628982543945, 0.0012278556823730469, 0.0012892484664916992, 0.0013506412506103516, 0.001412034034729004, 0.0014734268188476562, 0.0015348196029663086, 0.001596212387084961, 0.0016576051712036133, 0.0017189979553222656, 0.001780390739440918, 0.0018417835235595703, 0.0019031763076782227, 0.001964569091796875, 0.0020259618759155273, 0.0020873546600341797, 0.002148747444152832, 0.0022101402282714844, 0.0022715330123901367, 0.002332925796508789, 0.0023943185806274414, 0.0024557113647460938, 0.002517104148864746, 0.0025784969329833984, 0.0026398897171020508, 0.002701282501220703, 0.0027626752853393555, 0.002824068069458008, 0.00288546085357666, 0.0029468536376953125, 0.003008246421813965, 0.003069639205932617, 0.0031310319900512695, 0.003192424774169922, 0.0032538175582885742, 0.0033152103424072266, 0.003376603126525879, 0.0034379959106445312, 0.0034993886947631836, 0.003560781478881836, 0.0036221742630004883, 0.0036835670471191406, 0.003744959831237793, 0.0038063526153564453, 0.0038677453994750977, 0.00392913818359375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 999.0, 17.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02179417386651039, -0.020748240873217583, -0.019702306017279625, -0.018656373023986816, -0.01761043816804886, -0.01656450517475605, -0.015518572181463242, -0.014472638256847858, -0.013426704332232475, -0.012380770407617092, -0.011334836483001709, -0.0102889034897089, -0.009242969565093517, -0.008197035640478134, -0.007151102181524038, -0.0061051687225699425, -0.005059234797954559, -0.004013300873339176, -0.0029673674143850803, -0.0019214337226003408, -0.0008755000308156013, 0.0001704338937997818, 0.0012163673527538776, 0.0022623008117079735, 0.0033082347363233566, 0.00435416866093874, 0.005400102119892836, 0.0064460355788469315, 0.007491969503462315, 0.008537903428077698, 0.009583836421370506, 0.01062977034598589, 0.011675707995891571, 0.012721641920506954, 0.013767575845122337, 0.014813508838415146, 0.015859443694353104, 0.016905376687645912, 0.01795130968093872, 0.01899724453687668, 0.020043177530169487, 0.021089110523462296, 0.022135045379400253, 0.023180978372693062, 0.02422691136598587, 0.025272846221923828, 0.026318779215216637, 0.027364712208509445, 0.028410647064447403, 0.02945658005774021, 0.03050251491367817, 0.03154844790697098, 0.032594382762908936, 0.03364031761884689, 0.03468624874949455, 0.03573218360543251, 0.03677811473608017, 0.03782404959201813, 0.03886998072266579, 0.039915915578603745, 0.0409618504345417, 0.04200778156518936, 0.04305371642112732, 0.04409965127706528, 0.045145586133003235]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 10.0, 19.0, 35.0, 72.0, 140.0, 193.0, 183.0, 137.0, 96.0, 52.0, 26.0, 19.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003452479839324951, -0.003274080343544483, -0.003095680847764015, -0.002917281351983547, -0.0027388818562030792, -0.0025604823604226112, -0.0023820828646421432, -0.0022036833688616753, -0.0020252838730812073, -0.0018468843773007393, -0.0016684848815202713, -0.0014900853857398033, -0.0013116858899593353, -0.0011332863941788673, -0.0009548868983983994, -0.0007764874026179314, -0.0005980879068374634, -0.0004196884110569954, -0.0002412889152765274, -6.288941949605942e-05, 0.00011551007628440857, 0.00029390957206487656, 0.00047230906784534454, 0.0006507085636258125, 0.0008291080594062805, 0.0010075075551867485, 0.0011859070509672165, 0.0013643065467476845, 0.0015427060425281525, 0.0017211055383086205, 0.0018995050340890884, 0.0020779045298695564, 0.0022563040256500244, 0.0024347035214304924, 0.0026131030172109604, 0.0027915025129914284, 0.0029699020087718964, 0.0031483015045523643, 0.0033267010003328323, 0.0035051004961133003, 0.0036834999918937683, 0.0038618994876742363, 0.004040298983454704, 0.004218698479235172, 0.00439709797501564, 0.004575497470796108, 0.004753896966576576, 0.004932296462357044, 0.005110695958137512, 0.00528909545391798, 0.005467494949698448, 0.005645894445478916, 0.005824293941259384, 0.006002693437039852, 0.00618109293282032, 0.006359492428600788, 0.006537891924381256, 0.006716291420161724, 0.006894690915942192, 0.00707309041172266, 0.007251489907503128, 0.007429889403283596, 0.007608288899064064, 0.007786688394844532, 0.007965087890625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 6.0, 4.0, 7.0, 7.0, 15.0, 14.0, 7.0, 15.0, 22.0, 17.0, 25.0, 35.0, 38.0, 64.0, 97.0, 132.0, 208.0, 282.0, 414.0, 623.0, 913.0, 1750.0, 3684.0, 8635.0, 38145.0, 941417.0, 35517.0, 8454.0, 3396.0, 1690.0, 932.0, 615.0, 435.0, 307.0, 182.0, 138.0, 86.0, 47.0, 37.0, 32.0, 14.0, 17.0, 9.0, 12.0, 16.0, 7.0, 7.0, 6.0, 11.0, 2.0, 4.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.30615234375, -0.2964286804199219, -0.28670501708984375, -0.2769813537597656, -0.2672576904296875, -0.2575340270996094, -0.24781036376953125, -0.23808670043945312, -0.228363037109375, -0.21863937377929688, -0.20891571044921875, -0.19919204711914062, -0.1894683837890625, -0.17974472045898438, -0.17002105712890625, -0.16029739379882812, -0.15057373046875, -0.14085006713867188, -0.13112640380859375, -0.12140274047851562, -0.1116790771484375, -0.10195541381835938, -0.09223175048828125, -0.08250808715820312, -0.072784423828125, -0.06306076049804688, -0.05333709716796875, -0.043613433837890625, -0.0338897705078125, -0.024166107177734375, -0.01444244384765625, -0.004718780517578125, 0.0050048828125, 0.014728546142578125, 0.02445220947265625, 0.034175872802734375, 0.0438995361328125, 0.053623199462890625, 0.06334686279296875, 0.07307052612304688, 0.082794189453125, 0.09251785278320312, 0.10224151611328125, 0.11196517944335938, 0.1216888427734375, 0.13141250610351562, 0.14113616943359375, 0.15085983276367188, 0.16058349609375, 0.17030715942382812, 0.18003082275390625, 0.18975448608398438, 0.1994781494140625, 0.20920181274414062, 0.21892547607421875, 0.22864913940429688, 0.238372802734375, 0.24809646606445312, 0.25782012939453125, 0.2675437927246094, 0.2772674560546875, 0.2869911193847656, 0.29671478271484375, 0.3064384460449219, 0.316162109375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 3.0, 10.0, 8.0, 6.0, 6.0, 9.0, 14.0, 51.0, 159.0, 277.0, 231.0, 98.0, 22.0, 8.0, 6.0, 7.0, 13.0, 4.0, 6.0, 4.0, 5.0, 3.0, 4.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.171875, -0.16637039184570312, -0.16086578369140625, -0.15536117553710938, -0.1498565673828125, -0.14435195922851562, -0.13884735107421875, -0.13334274291992188, -0.127838134765625, -0.12233352661132812, -0.11682891845703125, -0.11132431030273438, -0.1058197021484375, -0.10031509399414062, -0.09481048583984375, -0.08930587768554688, -0.08380126953125, -0.07829666137695312, -0.07279205322265625, -0.06728744506835938, -0.0617828369140625, -0.056278228759765625, -0.05077362060546875, -0.045269012451171875, -0.039764404296875, -0.034259796142578125, -0.02875518798828125, -0.023250579833984375, -0.0177459716796875, -0.012241363525390625, -0.00673675537109375, -0.001232147216796875, 0.0042724609375, 0.009777069091796875, 0.01528167724609375, 0.020786285400390625, 0.0262908935546875, 0.031795501708984375, 0.03730010986328125, 0.042804718017578125, 0.048309326171875, 0.053813934326171875, 0.05931854248046875, 0.06482315063476562, 0.0703277587890625, 0.07583236694335938, 0.08133697509765625, 0.08684158325195312, 0.09234619140625, 0.09785079956054688, 0.10335540771484375, 0.10886001586914062, 0.1143646240234375, 0.11986923217773438, 0.12537384033203125, 0.13087844848632812, 0.136383056640625, 0.14188766479492188, 0.14739227294921875, 0.15289688110351562, 0.1584014892578125, 0.16390609741210938, 0.16941070556640625, 0.17491531372070312, 0.180419921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 6.0, 4.0, 3.0, 14.0, 10.0, 17.0, 19.0, 23.0, 14.0, 32.0, 38.0, 42.0, 82.0, 102.0, 140.0, 225.0, 544.0, 1690.0, 92642.0, 948865.0, 2472.0, 636.0, 287.0, 175.0, 107.0, 81.0, 79.0, 41.0, 39.0, 29.0, 24.0, 19.0, 16.0, 13.0, 7.0, 4.0, 2.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62744140625, -0.6066131591796875, -0.585784912109375, -0.5649566650390625, -0.54412841796875, -0.5233001708984375, -0.502471923828125, -0.4816436767578125, -0.4608154296875, -0.4399871826171875, -0.419158935546875, -0.3983306884765625, -0.37750244140625, -0.3566741943359375, -0.335845947265625, -0.3150177001953125, -0.294189453125, -0.2733612060546875, -0.252532958984375, -0.2317047119140625, -0.21087646484375, -0.1900482177734375, -0.169219970703125, -0.1483917236328125, -0.1275634765625, -0.1067352294921875, -0.085906982421875, -0.0650787353515625, -0.04425048828125, -0.0234222412109375, -0.002593994140625, 0.0182342529296875, 0.0390625, 0.0598907470703125, 0.080718994140625, 0.1015472412109375, 0.12237548828125, 0.1432037353515625, 0.164031982421875, 0.1848602294921875, 0.2056884765625, 0.2265167236328125, 0.247344970703125, 0.2681732177734375, 0.28900146484375, 0.3098297119140625, 0.330657958984375, 0.3514862060546875, 0.372314453125, 0.3931427001953125, 0.413970947265625, 0.4347991943359375, 0.45562744140625, 0.4764556884765625, 0.497283935546875, 0.5181121826171875, 0.5389404296875, 0.5597686767578125, 0.580596923828125, 0.6014251708984375, 0.62225341796875, 0.6430816650390625, 0.663909912109375, 0.6847381591796875, 0.70556640625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 6.0, 4.0, 2.0, 14.0, 10.0, 17.0, 18.0, 22.0, 12.0, 26.0, 32.0, 23.0, 46.0, 44.0, 31.0, 44.0, 45.0, 46.0, 53.0, 40.0, 55.0, 55.0, 44.0, 43.0, 30.0, 34.0, 41.0, 30.0, 23.0, 24.0, 19.0, 18.0, 16.0, 10.0, 8.0, 4.0, 2.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5078125, -0.49095916748046875, -0.4741058349609375, -0.45725250244140625, -0.440399169921875, -0.42354583740234375, -0.4066925048828125, -0.38983917236328125, -0.37298583984375, -0.35613250732421875, -0.3392791748046875, -0.32242584228515625, -0.305572509765625, -0.28871917724609375, -0.2718658447265625, -0.25501251220703125, -0.2381591796875, -0.22130584716796875, -0.2044525146484375, -0.18759918212890625, -0.170745849609375, -0.15389251708984375, -0.1370391845703125, -0.12018585205078125, -0.10333251953125, -0.08647918701171875, -0.0696258544921875, -0.05277252197265625, -0.035919189453125, -0.01906585693359375, -0.0022125244140625, 0.01464080810546875, 0.031494140625, 0.04834747314453125, 0.0652008056640625, 0.08205413818359375, 0.098907470703125, 0.11576080322265625, 0.1326141357421875, 0.14946746826171875, 0.16632080078125, 0.18317413330078125, 0.2000274658203125, 0.21688079833984375, 0.233734130859375, 0.25058746337890625, 0.2674407958984375, 0.28429412841796875, 0.3011474609375, 0.31800079345703125, 0.3348541259765625, 0.35170745849609375, 0.368560791015625, 0.38541412353515625, 0.4022674560546875, 0.41912078857421875, 0.43597412109375, 0.45282745361328125, 0.4696807861328125, 0.48653411865234375, 0.503387451171875, 0.5202407836914062, 0.5370941162109375, 0.5539474487304688, 0.57080078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 7.0, 8.0, 16.0, 26.0, 24.0, 41.0, 49.0, 98.0, 148.0, 217.0, 385.0, 727.0, 1426.0, 3398.0, 9316.0, 38242.0, 776414.0, 183255.0, 22982.0, 6712.0, 2484.0, 1125.0, 573.0, 323.0, 187.0, 112.0, 76.0, 38.0, 40.0, 29.0, 20.0, 5.0, 14.0, 11.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013744831085205078, -0.0001329910010099411, -0.00012853369116783142, -0.00012407638132572174, -0.00011961907148361206, -0.00011516176164150238, -0.0001107044517993927, -0.00010624714195728302, -0.00010178983211517334, -9.733252227306366e-05, -9.287521243095398e-05, -8.84179025888443e-05, -8.396059274673462e-05, -7.950328290462494e-05, -7.504597306251526e-05, -7.058866322040558e-05, -6.61313533782959e-05, -6.167404353618622e-05, -5.721673369407654e-05, -5.275942385196686e-05, -4.830211400985718e-05, -4.38448041677475e-05, -3.938749432563782e-05, -3.493018448352814e-05, -3.0472874641418457e-05, -2.6015564799308777e-05, -2.1558254957199097e-05, -1.7100945115089417e-05, -1.2643635272979736e-05, -8.186325430870056e-06, -3.729015588760376e-06, 7.282942533493042e-07, 5.185604095458984e-06, 9.642913937568665e-06, 1.4100223779678345e-05, 1.8557533621788025e-05, 2.3014843463897705e-05, 2.7472153306007385e-05, 3.1929463148117065e-05, 3.6386772990226746e-05, 4.0844082832336426e-05, 4.5301392674446106e-05, 4.9758702516555786e-05, 5.4216012358665466e-05, 5.8673322200775146e-05, 6.313063204288483e-05, 6.758794188499451e-05, 7.204525172710419e-05, 7.650256156921387e-05, 8.095987141132355e-05, 8.541718125343323e-05, 8.987449109554291e-05, 9.433180093765259e-05, 9.878911077976227e-05, 0.00010324642062187195, 0.00010770373046398163, 0.00011216104030609131, 0.00011661835014820099, 0.00012107565999031067, 0.00012553296983242035, 0.00012999027967453003, 0.0001344475895166397, 0.0001389048993587494, 0.00014336220920085907, 0.00014781951904296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 4.0, 6.0, 9.0, 16.0, 9.0, 18.0, 18.0, 30.0, 34.0, 31.0, 35.0, 50.0, 90.0, 48.0, 51.0, 50.0, 54.0, 75.0, 39.0, 47.0, 59.0, 47.0, 20.0, 33.0, 24.0, 23.0, 22.0, 11.0, 8.0, 8.0, 8.0, 3.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.0531158447265625e-06, -3.9208680391311646e-06, -3.7886202335357666e-06, -3.6563724279403687e-06, -3.5241246223449707e-06, -3.3918768167495728e-06, -3.259629011154175e-06, -3.127381205558777e-06, -2.995133399963379e-06, -2.862885594367981e-06, -2.730637788772583e-06, -2.598389983177185e-06, -2.466142177581787e-06, -2.333894371986389e-06, -2.201646566390991e-06, -2.0693987607955933e-06, -1.9371509552001953e-06, -1.8049031496047974e-06, -1.6726553440093994e-06, -1.5404075384140015e-06, -1.4081597328186035e-06, -1.2759119272232056e-06, -1.1436641216278076e-06, -1.0114163160324097e-06, -8.791685104370117e-07, -7.469207048416138e-07, -6.146728992462158e-07, -4.824250936508179e-07, -3.501772880554199e-07, -2.1792948246002197e-07, -8.568167686462402e-08, 4.6566128730773926e-08, 1.7881393432617188e-07, 3.110617399215698e-07, 4.4330954551696777e-07, 5.755573511123657e-07, 7.078051567077637e-07, 8.400529623031616e-07, 9.723007678985596e-07, 1.1045485734939575e-06, 1.2367963790893555e-06, 1.3690441846847534e-06, 1.5012919902801514e-06, 1.6335397958755493e-06, 1.7657876014709473e-06, 1.8980354070663452e-06, 2.030283212661743e-06, 2.162531018257141e-06, 2.294778823852539e-06, 2.427026629447937e-06, 2.559274435043335e-06, 2.691522240638733e-06, 2.823770046234131e-06, 2.956017851829529e-06, 3.0882656574249268e-06, 3.2205134630203247e-06, 3.3527612686157227e-06, 3.4850090742111206e-06, 3.6172568798065186e-06, 3.7495046854019165e-06, 3.8817524909973145e-06, 4.014000296592712e-06, 4.14624810218811e-06, 4.278495907783508e-06, 4.410743713378906e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 8.0, 2.0, 15.0, 12.0, 17.0, 24.0, 38.0, 49.0, 87.0, 153.0, 388.0, 1781.0, 1035449.0, 9356.0, 613.0, 226.0, 102.0, 75.0, 34.0, 32.0, 22.0, 14.0, 7.0, 12.0, 5.0, 7.0, 5.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005459785461425781, -0.000527597963809967, -0.000509217381477356, -0.0004908367991447449, -0.0004724562168121338, -0.0004540756344795227, -0.0004356950521469116, -0.00041731446981430054, -0.00039893388748168945, -0.00038055330514907837, -0.0003621727228164673, -0.0003437921404838562, -0.0003254115581512451, -0.00030703097581863403, -0.00028865039348602295, -0.00027026981115341187, -0.0002518892288208008, -0.0002335086464881897, -0.0002151280641555786, -0.00019674748182296753, -0.00017836689949035645, -0.00015998631715774536, -0.00014160573482513428, -0.0001232251524925232, -0.00010484457015991211, -8.646398782730103e-05, -6.808340549468994e-05, -4.970282316207886e-05, -3.1322240829467773e-05, -1.294165849685669e-05, 5.4389238357543945e-06, 2.381950616836548e-05, 4.220008850097656e-05, 6.0580670833587646e-05, 7.896125316619873e-05, 9.734183549880981e-05, 0.0001157224178314209, 0.00013410300016403198, 0.00015248358249664307, 0.00017086416482925415, 0.00018924474716186523, 0.00020762532949447632, 0.0002260059118270874, 0.0002443864941596985, 0.00026276707649230957, 0.00028114765882492065, 0.00029952824115753174, 0.0003179088234901428, 0.0003362894058227539, 0.000354669988155365, 0.0003730505704879761, 0.00039143115282058716, 0.00040981173515319824, 0.0004281923174858093, 0.0004465728998184204, 0.0004649534821510315, 0.0004833340644836426, 0.0005017146468162537, 0.0005200952291488647, 0.0005384758114814758, 0.0005568563938140869, 0.000575236976146698, 0.0005936175584793091, 0.0006119981408119202, 0.0006303787231445312]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 2.0, 12.0, 10.0, 12.0, 13.0, 25.0, 23.0, 35.0, 43.0, 69.0, 112.0, 182.0, 142.0, 83.0, 57.0, 42.0, 26.0, 17.0, 21.0, 15.0, 9.0, 5.0, 8.0, 3.0, 6.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004420280456542969, -0.00042714923620224, -0.0004122704267501831, -0.0003973916172981262, -0.00038251280784606934, -0.00036763399839401245, -0.00035275518894195557, -0.0003378763794898987, -0.0003229975700378418, -0.0003081187605857849, -0.00029323995113372803, -0.00027836114168167114, -0.00026348233222961426, -0.0002486035227775574, -0.0002337247133255005, -0.0002188459038734436, -0.00020396709442138672, -0.00018908828496932983, -0.00017420947551727295, -0.00015933066606521606, -0.00014445185661315918, -0.0001295730471611023, -0.00011469423770904541, -9.981542825698853e-05, -8.493661880493164e-05, -7.005780935287476e-05, -5.517899990081787e-05, -4.0300190448760986e-05, -2.54213809967041e-05, -1.0542571544647217e-05, 4.336237907409668e-06, 1.9215047359466553e-05, 3.409385681152344e-05, 4.897266626358032e-05, 6.385147571563721e-05, 7.873028516769409e-05, 9.360909461975098e-05, 0.00010848790407180786, 0.00012336671352386475, 0.00013824552297592163, 0.00015312433242797852, 0.0001680031418800354, 0.00018288195133209229, 0.00019776076078414917, 0.00021263957023620605, 0.00022751837968826294, 0.00024239718914031982, 0.0002572759985923767, 0.0002721548080444336, 0.0002870336174964905, 0.00030191242694854736, 0.00031679123640060425, 0.00033167004585266113, 0.000346548855304718, 0.0003614276647567749, 0.0003763064742088318, 0.00039118528366088867, 0.00040606409311294556, 0.00042094290256500244, 0.0004358217120170593, 0.0004507005214691162, 0.0004655793309211731, 0.00048045814037323, 0.0004953369498252869, 0.0005102157592773438]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 15.0, 813.0, 179.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.30239486694336, -8.125077247619629, -7.947759628295898, -7.770442008972168, -7.5931243896484375, -7.415807247161865, -7.238489627838135, -7.061172008514404, -6.883854389190674, -6.706536769866943, -6.529219150543213, -6.351901531219482, -6.17458438873291, -5.99726676940918, -5.819949150085449, -5.642631530761719, -5.465313911437988, -5.287996292114258, -5.110678672790527, -4.933361053466797, -4.756043434143066, -4.578726291656494, -4.401408672332764, -4.224091053009033, -4.046773433685303, -3.8694558143615723, -3.692138195037842, -3.5148208141326904, -3.33750319480896, -3.1601855754852295, -2.982868194580078, -2.8055505752563477, -2.628232955932617, -2.4509153366088867, -2.2735977172851562, -2.096280336380005, -1.9189627170562744, -1.741645097732544, -1.564327597618103, -1.387010097503662, -1.2096924781799316, -1.0323748588562012, -0.8550573587417603, -0.6777397990226746, -0.5004222393035889, -0.3231046795845032, -0.14578711986541748, 0.03153038024902344, 0.2088479995727539, 0.3861655592918396, 0.5634831190109253, 0.740800678730011, 0.9181182384490967, 1.0954358577728271, 1.272753357887268, 1.450070858001709, 1.6273884773254395, 1.80470609664917, 1.9820235967636108, 2.1593410968780518, 2.3366587162017822, 2.5139763355255127, 2.691293716430664, 2.8686113357543945, 3.045928955078125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 6.0, 8.0, 10.0, 7.0, 13.0, 16.0, 18.0, 17.0, 23.0, 20.0, 20.0, 33.0, 32.0, 55.0, 47.0, 47.0, 55.0, 54.0, 74.0, 58.0, 50.0, 45.0, 50.0, 38.0, 40.0, 31.0, 26.0, 16.0, 24.0, 16.0, 11.0, 11.0, 9.0, 4.0, 5.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.377265453338623, -3.287642002105713, -3.198018789291382, -3.1083953380584717, -3.0187718868255615, -2.9291486740112305, -2.8395252227783203, -2.74990177154541, -2.6602783203125, -2.57065486907959, -2.481031656265259, -2.3914082050323486, -2.3017847537994385, -2.2121615409851074, -2.1225380897521973, -2.032914638519287, -1.943291425704956, -1.8536680936813354, -1.7640446424484253, -1.6744213104248047, -1.5847978591918945, -1.495174527168274, -1.4055511951446533, -1.3159277439117432, -1.2263044118881226, -1.136681079864502, -1.0470576286315918, -0.9574342966079712, -0.8678109049797058, -0.7781875133514404, -0.6885641813278198, -0.5989407896995544, -0.5093173980712891, -0.4196940064430237, -0.3300706446170807, -0.2404472827911377, -0.15082389116287231, -0.061200499534606934, 0.028422832489013672, 0.11804622411727905, 0.20766961574554443, 0.2972930073738098, 0.3869163691997528, 0.4765397310256958, 0.5661631226539612, 0.6557865142822266, 0.7454098463058472, 0.8350332379341125, 0.9246566295623779, 1.0142799615859985, 1.1039034128189087, 1.1935267448425293, 1.2831501960754395, 1.37277352809906, 1.4623968601226807, 1.5520203113555908, 1.6416436433792114, 1.731266975402832, 1.8208904266357422, 1.9105137586593628, 2.0001370906829834, 2.0897605419158936, 2.1793837547302246, 2.2690072059631348, 2.358630657196045]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 5.0, 4.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 3.0, 4.0, 7.0, 4.0, 5.0, 3.0, 12.0, 8.0, 7.0, 9.0, 25.0, 134.0, 4193484.0, 281.0, 148.0, 45.0, 15.0, 8.0, 6.0, 7.0, 6.0, 10.0, 4.0, 4.0, 7.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0300750732421875, -0.02915358543395996, -0.028232097625732422, -0.027310609817504883, -0.026389122009277344, -0.025467634201049805, -0.024546146392822266, -0.023624658584594727, -0.022703170776367188, -0.02178168296813965, -0.02086019515991211, -0.01993870735168457, -0.01901721954345703, -0.018095731735229492, -0.017174243927001953, -0.016252756118774414, -0.015331268310546875, -0.014409780502319336, -0.013488292694091797, -0.012566804885864258, -0.011645317077636719, -0.01072382926940918, -0.00980234146118164, -0.008880853652954102, -0.007959365844726562, -0.0070378780364990234, -0.006116390228271484, -0.005194902420043945, -0.004273414611816406, -0.003351926803588867, -0.002430438995361328, -0.001508951187133789, -0.00058746337890625, 0.00033402442932128906, 0.0012555122375488281, 0.002177000045776367, 0.0030984878540039062, 0.004019975662231445, 0.004941463470458984, 0.0058629512786865234, 0.0067844390869140625, 0.0077059268951416016, 0.00862741470336914, 0.00954890251159668, 0.010470390319824219, 0.011391878128051758, 0.012313365936279297, 0.013234853744506836, 0.014156341552734375, 0.015077829360961914, 0.015999317169189453, 0.016920804977416992, 0.01784229278564453, 0.01876378059387207, 0.01968526840209961, 0.02060675621032715, 0.021528244018554688, 0.022449731826782227, 0.023371219635009766, 0.024292707443237305, 0.025214195251464844, 0.026135683059692383, 0.027057170867919922, 0.02797865867614746, 0.028900146484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 4.0, 4.0, 10.0, 7.0, 5.0, 7.0, 8.0, 15.0, 45.0, 148.0, 251.0, 253.0, 116.0, 24.0, 9.0, 7.0, 8.0, 12.0, 3.0, 5.0, 4.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1715087890625, -0.16603851318359375, -0.1605682373046875, -0.15509796142578125, -0.149627685546875, -0.14415740966796875, -0.1386871337890625, -0.13321685791015625, -0.12774658203125, -0.12227630615234375, -0.1168060302734375, -0.11133575439453125, -0.105865478515625, -0.10039520263671875, -0.0949249267578125, -0.08945465087890625, -0.083984375, -0.07851409912109375, -0.0730438232421875, -0.06757354736328125, -0.062103271484375, -0.05663299560546875, -0.0511627197265625, -0.04569244384765625, -0.04022216796875, -0.03475189208984375, -0.0292816162109375, -0.02381134033203125, -0.018341064453125, -0.01287078857421875, -0.0074005126953125, -0.00193023681640625, 0.0035400390625, 0.00901031494140625, 0.0144805908203125, 0.01995086669921875, 0.025421142578125, 0.03089141845703125, 0.0363616943359375, 0.04183197021484375, 0.04730224609375, 0.05277252197265625, 0.0582427978515625, 0.06371307373046875, 0.069183349609375, 0.07465362548828125, 0.0801239013671875, 0.08559417724609375, 0.091064453125, 0.09653472900390625, 0.1020050048828125, 0.10747528076171875, 0.112945556640625, 0.11841583251953125, 0.1238861083984375, 0.12935638427734375, 0.13482666015625, 0.14029693603515625, 0.1457672119140625, 0.15123748779296875, 0.156707763671875, 0.16217803955078125, 0.1676483154296875, 0.17311859130859375, 0.1785888671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 28.0, 56.0, 133.0, 248.0, 442.0, 705.0, 4190854.0, 807.0, 490.0, 249.0, 125.0, 73.0, 27.0, 16.0, 10.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021419525146484375, -0.002083510160446167, -0.0020250678062438965, -0.001966625452041626, -0.0019081830978393555, -0.001849740743637085, -0.0017912983894348145, -0.001732856035232544, -0.0016744136810302734, -0.001615971326828003, -0.0015575289726257324, -0.001499086618423462, -0.0014406442642211914, -0.001382201910018921, -0.0013237595558166504, -0.0012653172016143799, -0.0012068748474121094, -0.0011484324932098389, -0.0010899901390075684, -0.0010315477848052979, -0.0009731054306030273, -0.0009146630764007568, -0.0008562207221984863, -0.0007977783679962158, -0.0007393360137939453, -0.0006808936595916748, -0.0006224513053894043, -0.0005640089511871338, -0.0005055665969848633, -0.0004471242427825928, -0.00038868188858032227, -0.00033023953437805176, -0.00027179718017578125, -0.00021335482597351074, -0.00015491247177124023, -9.647011756896973e-05, -3.802776336669922e-05, 2.041459083557129e-05, 7.88569450378418e-05, 0.0001372992992401123, 0.0001957416534423828, 0.0002541840076446533, 0.00031262636184692383, 0.00037106871604919434, 0.00042951107025146484, 0.00048795342445373535, 0.0005463957786560059, 0.0006048381328582764, 0.0006632804870605469, 0.0007217228412628174, 0.0007801651954650879, 0.0008386075496673584, 0.0008970499038696289, 0.0009554922580718994, 0.00101393461227417, 0.0010723769664764404, 0.001130819320678711, 0.0011892616748809814, 0.001247704029083252, 0.0013061463832855225, 0.001364588737487793, 0.0014230310916900635, 0.001481473445892334, 0.0015399158000946045, 0.001598358154296875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4087.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003199577331542969, -0.00030507147312164307, -0.00029018521308898926, -0.00027529895305633545, -0.00026041269302368164, -0.00024552643299102783, -0.00023064017295837402, -0.00021575391292572021, -0.0002008676528930664, -0.0001859813928604126, -0.0001710951328277588, -0.00015620887279510498, -0.00014132261276245117, -0.00012643635272979736, -0.00011155009269714355, -9.666383266448975e-05, -8.177757263183594e-05, -6.689131259918213e-05, -5.200505256652832e-05, -3.711879253387451e-05, -2.2232532501220703e-05, -7.3462724685668945e-06, 7.539987564086914e-06, 2.2426247596740723e-05, 3.731250762939453e-05, 5.219876766204834e-05, 6.708502769470215e-05, 8.197128772735596e-05, 9.685754776000977e-05, 0.00011174380779266357, 0.00012663006782531738, 0.0001415163278579712, 0.000156402587890625, 0.0001712888479232788, 0.00018617510795593262, 0.00020106136798858643, 0.00021594762802124023, 0.00023083388805389404, 0.00024572014808654785, 0.00026060640811920166, 0.00027549266815185547, 0.0002903789281845093, 0.0003052651882171631, 0.0003201514482498169, 0.0003350377082824707, 0.0003499239683151245, 0.0003648102283477783, 0.00037969648838043213, 0.00039458274841308594, 0.00040946900844573975, 0.00042435526847839355, 0.00043924152851104736, 0.00045412778854370117, 0.000469014048576355, 0.0004839003086090088, 0.0004987865686416626, 0.0005136728286743164, 0.0005285590887069702, 0.000543445348739624, 0.0005583316087722778, 0.0005732178688049316, 0.0005881041288375854, 0.0006029903888702393, 0.0006178766489028931, 0.0006327629089355469]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1001.0, 12.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004166252911090851, -0.004025673493742943, -0.0038850936107337475, -0.003744513960555196, -0.003603934310376644, -0.003463354893028736, -0.0033227752428501844, -0.0031821955926716328, -0.003041615942493081, -0.0029010362923145294, -0.0027604566421359777, -0.002619876991957426, -0.002479297574609518, -0.0023387176916003227, -0.0021981382742524147, -0.002057558624073863, -0.0019169789738953114, -0.0017763993237167597, -0.001635819673538208, -0.0014952401397749782, -0.0013546604895964265, -0.0012140808394178748, -0.001073501305654645, -0.0009329216554760933, -0.0007923420052975416, -0.0006517623551189899, -0.0005111827631480992, -0.00037060314207337797, -0.00023002352099865675, -8.944387082010508e-05, 5.1135721150785685e-05, 0.00019171531312167645, 0.0003322944976389408, 0.00047287411871366203, 0.0006134537397883832, 0.000754033331759274, 0.0008946129819378257, 0.0010351926321163774, 0.0011757721658796072, 0.0013163518160581589, 0.0014569314662367105, 0.0015975111164152622, 0.001738090766593814, 0.0018786703003570437, 0.0020192498341202736, 0.002159829717129469, 0.002300409134477377, 0.0024409887846559286, 0.0025815684348344803, 0.002722148085013032, 0.0028627277351915836, 0.0030033073853701353, 0.003143887035548687, 0.003284466452896595, 0.0034250461030751467, 0.0035656257532536983, 0.00370620540343225, 0.0038467850536108017, 0.00398736447095871, 0.004127944353967905, 0.004268523771315813, 0.004409103654325008, 0.004549683071672916, 0.004690262489020824, 0.00483084237203002]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 11.0, 27.0, 74.0, 79.0, 124.0, 144.0, 124.0, 144.0, 104.0, 63.0, 44.0, 28.0, 13.0, 3.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009211897850036621, -0.000885901041328907, -0.0008506122976541519, -0.0008153235539793968, -0.0007800348103046417, -0.0007447460666298866, -0.0007094573229551315, -0.0006741685792803764, -0.0006388798356056213, -0.0006035910919308662, -0.0005683023482561111, -0.000533013604581356, -0.000497724860906601, -0.00046243611723184586, -0.00042714737355709076, -0.00039185862988233566, -0.00035656988620758057, -0.00032128114253282547, -0.0002859923988580704, -0.0002507036551833153, -0.00021541491150856018, -0.00018012616783380508, -0.00014483742415905, -0.00010954868048429489, -7.42599368095398e-05, -3.89711931347847e-05, -3.682449460029602e-06, 3.1606294214725494e-05, 6.689503788948059e-05, 0.00010218378156423569, 0.00013747252523899078, 0.00017276126891374588, 0.00020805001258850098, 0.00024333875626325607, 0.00027862749993801117, 0.00031391624361276627, 0.00034920498728752136, 0.00038449373096227646, 0.00041978247463703156, 0.00045507121831178665, 0.0004903599619865417, 0.0005256487056612968, 0.0005609374493360519, 0.000596226193010807, 0.0006315149366855621, 0.0006668036803603172, 0.0007020924240350723, 0.0007373811677098274, 0.0007726699113845825, 0.0008079586550593376, 0.0008432473987340927, 0.0008785361424088478, 0.0009138248860836029, 0.000949113629758358, 0.000984402373433113, 0.0010196911171078682, 0.0010549798607826233, 0.0010902686044573784, 0.0011255573481321335, 0.0011608460918068886, 0.0011961348354816437, 0.0012314235791563988, 0.0012667123228311539, 0.001302001066505909, 0.001337289810180664]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 7.0, 9.0, 14.0, 12.0, 30.0, 32.0, 29.0, 40.0, 56.0, 52.0, 77.0, 103.0, 102.0, 147.0, 183.0, 245.0, 414.0, 616.0, 1067.0, 1666.0, 2825.0, 5444.0, 13306.0, 64820.0, 904141.0, 32037.0, 9985.0, 4349.0, 2287.0, 1457.0, 901.0, 588.0, 386.0, 283.0, 180.0, 153.0, 104.0, 84.0, 59.0, 47.0, 50.0, 24.0, 24.0, 21.0, 19.0, 16.0, 11.0, 13.0, 13.0, 0.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.287353515625, -0.2781867980957031, -0.26902008056640625, -0.2598533630371094, -0.2506866455078125, -0.24151992797851562, -0.23235321044921875, -0.22318649291992188, -0.214019775390625, -0.20485305786132812, -0.19568634033203125, -0.18651962280273438, -0.1773529052734375, -0.16818618774414062, -0.15901947021484375, -0.14985275268554688, -0.14068603515625, -0.13151931762695312, -0.12235260009765625, -0.11318588256835938, -0.1040191650390625, -0.09485244750976562, -0.08568572998046875, -0.07651901245117188, -0.067352294921875, -0.058185577392578125, -0.04901885986328125, -0.039852142333984375, -0.0306854248046875, -0.021518707275390625, -0.01235198974609375, -0.003185272216796875, 0.0059814453125, 0.015148162841796875, 0.02431488037109375, 0.033481597900390625, 0.0426483154296875, 0.051815032958984375, 0.06098175048828125, 0.07014846801757812, 0.079315185546875, 0.08848190307617188, 0.09764862060546875, 0.10681533813476562, 0.1159820556640625, 0.12514877319335938, 0.13431549072265625, 0.14348220825195312, 0.15264892578125, 0.16181564331054688, 0.17098236083984375, 0.18014907836914062, 0.1893157958984375, 0.19848251342773438, 0.20764923095703125, 0.21681594848632812, 0.225982666015625, 0.23514938354492188, 0.24431610107421875, 0.2534828186035156, 0.2626495361328125, 0.2718162536621094, 0.28098297119140625, 0.2901496887207031, 0.29931640625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 4.0, 4.0, 10.0, 7.0, 5.0, 7.0, 8.0, 15.0, 45.0, 148.0, 251.0, 253.0, 116.0, 24.0, 9.0, 7.0, 8.0, 12.0, 3.0, 5.0, 4.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1715087890625, -0.16603851318359375, -0.1605682373046875, -0.15509796142578125, -0.149627685546875, -0.14415740966796875, -0.1386871337890625, -0.13321685791015625, -0.12774658203125, -0.12227630615234375, -0.1168060302734375, -0.11133575439453125, -0.105865478515625, -0.10039520263671875, -0.0949249267578125, -0.08945465087890625, -0.083984375, -0.07851409912109375, -0.0730438232421875, -0.06757354736328125, -0.062103271484375, -0.05663299560546875, -0.0511627197265625, -0.04569244384765625, -0.04022216796875, -0.03475189208984375, -0.0292816162109375, -0.02381134033203125, -0.018341064453125, -0.01287078857421875, -0.0074005126953125, -0.00193023681640625, 0.0035400390625, 0.00901031494140625, 0.0144805908203125, 0.01995086669921875, 0.025421142578125, 0.03089141845703125, 0.0363616943359375, 0.04183197021484375, 0.04730224609375, 0.05277252197265625, 0.0582427978515625, 0.06371307373046875, 0.069183349609375, 0.07465362548828125, 0.0801239013671875, 0.08559417724609375, 0.091064453125, 0.09653472900390625, 0.1020050048828125, 0.10747528076171875, 0.112945556640625, 0.11841583251953125, 0.1238861083984375, 0.12935638427734375, 0.13482666015625, 0.14029693603515625, 0.1457672119140625, 0.15123748779296875, 0.156707763671875, 0.16217803955078125, 0.1676483154296875, 0.17311859130859375, 0.1785888671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 5.0, 4.0, 4.0, 8.0, 8.0, 7.0, 11.0, 12.0, 13.0, 26.0, 27.0, 16.0, 32.0, 37.0, 61.0, 60.0, 93.0, 164.0, 332.0, 819.0, 2840.0, 907269.0, 132981.0, 2120.0, 741.0, 329.0, 171.0, 90.0, 61.0, 43.0, 29.0, 24.0, 19.0, 18.0, 16.0, 8.0, 11.0, 10.0, 5.0, 10.0, 4.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65234375, -0.6312408447265625, -0.610137939453125, -0.5890350341796875, -0.56793212890625, -0.5468292236328125, -0.525726318359375, -0.5046234130859375, -0.4835205078125, -0.4624176025390625, -0.441314697265625, -0.4202117919921875, -0.39910888671875, -0.3780059814453125, -0.356903076171875, -0.3358001708984375, -0.314697265625, -0.2935943603515625, -0.272491455078125, -0.2513885498046875, -0.23028564453125, -0.2091827392578125, -0.188079833984375, -0.1669769287109375, -0.1458740234375, -0.1247711181640625, -0.103668212890625, -0.0825653076171875, -0.06146240234375, -0.0403594970703125, -0.019256591796875, 0.0018463134765625, 0.02294921875, 0.0440521240234375, 0.065155029296875, 0.0862579345703125, 0.10736083984375, 0.1284637451171875, 0.149566650390625, 0.1706695556640625, 0.1917724609375, 0.2128753662109375, 0.233978271484375, 0.2550811767578125, 0.27618408203125, 0.2972869873046875, 0.318389892578125, 0.3394927978515625, 0.360595703125, 0.3816986083984375, 0.402801513671875, 0.4239044189453125, 0.44500732421875, 0.4661102294921875, 0.487213134765625, 0.5083160400390625, 0.5294189453125, 0.5505218505859375, 0.571624755859375, 0.5927276611328125, 0.61383056640625, 0.6349334716796875, 0.656036376953125, 0.6771392822265625, 0.6982421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 5.0, 4.0, 4.0, 9.0, 7.0, 7.0, 11.0, 12.0, 13.0, 25.0, 26.0, 15.0, 28.0, 29.0, 43.0, 34.0, 40.0, 40.0, 38.0, 42.0, 49.0, 47.0, 36.0, 47.0, 40.0, 52.0, 43.0, 39.0, 34.0, 28.0, 25.0, 16.0, 18.0, 16.0, 16.0, 8.0, 11.0, 11.0, 4.0, 10.0, 4.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.458251953125, -0.44342803955078125, -0.4286041259765625, -0.41378021240234375, -0.398956298828125, -0.38413238525390625, -0.3693084716796875, -0.35448455810546875, -0.33966064453125, -0.32483673095703125, -0.3100128173828125, -0.29518890380859375, -0.280364990234375, -0.26554107666015625, -0.2507171630859375, -0.23589324951171875, -0.2210693359375, -0.20624542236328125, -0.1914215087890625, -0.17659759521484375, -0.161773681640625, -0.14694976806640625, -0.1321258544921875, -0.11730194091796875, -0.10247802734375, -0.08765411376953125, -0.0728302001953125, -0.05800628662109375, -0.043182373046875, -0.02835845947265625, -0.0135345458984375, 0.00128936767578125, 0.01611328125, 0.03093719482421875, 0.0457611083984375, 0.06058502197265625, 0.075408935546875, 0.09023284912109375, 0.1050567626953125, 0.11988067626953125, 0.13470458984375, 0.14952850341796875, 0.1643524169921875, 0.17917633056640625, 0.194000244140625, 0.20882415771484375, 0.2236480712890625, 0.23847198486328125, 0.2532958984375, 0.26811981201171875, 0.2829437255859375, 0.29776763916015625, 0.312591552734375, 0.32741546630859375, 0.3422393798828125, 0.35706329345703125, 0.37188720703125, 0.38671112060546875, 0.4015350341796875, 0.41635894775390625, 0.431182861328125, 0.44600677490234375, 0.4608306884765625, 0.47565460205078125, 0.490478515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 1.0, 3.0, 11.0, 9.0, 18.0, 30.0, 33.0, 40.0, 90.0, 145.0, 219.0, 386.0, 777.0, 2048.0, 6809.0, 34685.0, 862712.0, 120631.0, 13723.0, 3667.0, 1253.0, 541.0, 285.0, 160.0, 94.0, 62.0, 43.0, 21.0, 19.0, 11.0, 6.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011152029037475586, -0.00010718870908021927, -0.00010285712778568268, -9.852554649114609e-05, -9.41939651966095e-05, -8.98623839020729e-05, -8.553080260753632e-05, -8.119922131299973e-05, -7.686764001846313e-05, -7.253605872392654e-05, -6.820447742938995e-05, -6.387289613485336e-05, -5.954131484031677e-05, -5.520973354578018e-05, -5.087815225124359e-05, -4.6546570956707e-05, -4.221498966217041e-05, -3.788340836763382e-05, -3.355182707309723e-05, -2.922024577856064e-05, -2.4888664484024048e-05, -2.0557083189487457e-05, -1.6225501894950867e-05, -1.1893920600414276e-05, -7.5623393058776855e-06, -3.230758011341095e-06, 1.1008232831954956e-06, 5.432404577732086e-06, 9.763985872268677e-06, 1.4095567166805267e-05, 1.8427148461341858e-05, 2.275872975587845e-05, 2.709031105041504e-05, 3.142189234495163e-05, 3.575347363948822e-05, 4.008505493402481e-05, 4.44166362285614e-05, 4.874821752309799e-05, 5.307979881763458e-05, 5.741138011217117e-05, 6.174296140670776e-05, 6.607454270124435e-05, 7.040612399578094e-05, 7.473770529031754e-05, 7.906928658485413e-05, 8.340086787939072e-05, 8.773244917392731e-05, 9.20640304684639e-05, 9.639561176300049e-05, 0.00010072719305753708, 0.00010505877435207367, 0.00010939035564661026, 0.00011372193694114685, 0.00011805351823568344, 0.00012238509953022003, 0.00012671668082475662, 0.0001310482621192932, 0.0001353798434138298, 0.0001397114247083664, 0.00014404300600290298, 0.00014837458729743958, 0.00015270616859197617, 0.00015703774988651276, 0.00016136933118104935, 0.00016570091247558594]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 2.0, 9.0, 4.0, 18.0, 20.0, 7.0, 11.0, 16.0, 32.0, 26.0, 46.0, 23.0, 48.0, 28.0, 60.0, 65.0, 26.0, 69.0, 37.0, 76.0, 30.0, 63.0, 25.0, 57.0, 28.0, 33.0, 29.0, 16.0, 26.0, 9.0, 15.0, 8.0, 8.0, 4.0, 8.0, 2.0, 7.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.2186508178710938e-06, -3.1264498829841614e-06, -3.034248948097229e-06, -2.9420480132102966e-06, -2.8498470783233643e-06, -2.757646143436432e-06, -2.6654452085494995e-06, -2.573244273662567e-06, -2.4810433387756348e-06, -2.3888424038887024e-06, -2.29664146900177e-06, -2.2044405341148376e-06, -2.1122395992279053e-06, -2.020038664340973e-06, -1.9278377294540405e-06, -1.8356367945671082e-06, -1.7434358596801758e-06, -1.6512349247932434e-06, -1.559033989906311e-06, -1.4668330550193787e-06, -1.3746321201324463e-06, -1.282431185245514e-06, -1.1902302503585815e-06, -1.0980293154716492e-06, -1.0058283805847168e-06, -9.136274456977844e-07, -8.21426510810852e-07, -7.292255759239197e-07, -6.370246410369873e-07, -5.448237061500549e-07, -4.5262277126312256e-07, -3.604218363761902e-07, -2.682209014892578e-07, -1.7601996660232544e-07, -8.381903171539307e-08, 8.381903171539307e-09, 1.0058283805847168e-07, 1.9278377294540405e-07, 2.849847078323364e-07, 3.771856427192688e-07, 4.6938657760620117e-07, 5.615875124931335e-07, 6.537884473800659e-07, 7.459893822669983e-07, 8.381903171539307e-07, 9.30391252040863e-07, 1.0225921869277954e-06, 1.1147931218147278e-06, 1.2069940567016602e-06, 1.2991949915885925e-06, 1.391395926475525e-06, 1.4835968613624573e-06, 1.5757977962493896e-06, 1.667998731136322e-06, 1.7601996660232544e-06, 1.8524006009101868e-06, 1.944601535797119e-06, 2.0368024706840515e-06, 2.129003405570984e-06, 2.2212043404579163e-06, 2.3134052753448486e-06, 2.405606210231781e-06, 2.4978071451187134e-06, 2.5900080800056458e-06, 2.682209014892578e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 8.0, 6.0, 11.0, 12.0, 19.0, 22.0, 36.0, 73.0, 155.0, 462.0, 3866.0, 1041382.0, 1885.0, 318.0, 125.0, 62.0, 33.0, 24.0, 15.0, 10.0, 7.0, 12.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041365623474121094, -0.00039231404662132263, -0.0003709718585014343, -0.000349629670381546, -0.0003282874822616577, -0.0003069452941417694, -0.0002856031060218811, -0.0002642609179019928, -0.0002429187297821045, -0.0002215765416622162, -0.00020023435354232788, -0.00017889216542243958, -0.00015754997730255127, -0.00013620778918266296, -0.00011486560106277466, -9.352341294288635e-05, -7.218122482299805e-05, -5.083903670310974e-05, -2.9496848583221436e-05, -8.15466046333313e-06, 1.3187527656555176e-05, 3.452971577644348e-05, 5.587190389633179e-05, 7.721409201622009e-05, 9.85562801361084e-05, 0.0001198984682559967, 0.000141240656375885, 0.00016258284449577332, 0.00018392503261566162, 0.00020526722073554993, 0.00022660940885543823, 0.00024795159697532654, 0.00026929378509521484, 0.00029063597321510315, 0.00031197816133499146, 0.00033332034945487976, 0.00035466253757476807, 0.00037600472569465637, 0.0003973469138145447, 0.000418689101934433, 0.0004400312900543213, 0.0004613734781742096, 0.0004827156662940979, 0.0005040578544139862, 0.0005254000425338745, 0.0005467422306537628, 0.0005680844187736511, 0.0005894266068935394, 0.0006107687950134277, 0.000632110983133316, 0.0006534531712532043, 0.0006747953593730927, 0.000696137547492981, 0.0007174797356128693, 0.0007388219237327576, 0.0007601641118526459, 0.0007815062999725342, 0.0008028484880924225, 0.0008241906762123108, 0.0008455328643321991, 0.0008668750524520874, 0.0008882172405719757, 0.000909559428691864, 0.0009309016168117523, 0.0009522438049316406]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 7.0, 4.0, 10.0, 10.0, 16.0, 16.0, 27.0, 44.0, 59.0, 87.0, 148.0, 199.0, 131.0, 63.0, 53.0, 38.0, 28.0, 16.0, 8.0, 10.0, 7.0, 12.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002906322479248047, -0.00027563050389289856, -0.00026062875986099243, -0.0002456270158290863, -0.00023062527179718018, -0.00021562352776527405, -0.00020062178373336792, -0.0001856200397014618, -0.00017061829566955566, -0.00015561655163764954, -0.0001406148076057434, -0.00012561306357383728, -0.00011061131954193115, -9.560957551002502e-05, -8.06078314781189e-05, -6.560608744621277e-05, -5.060434341430664e-05, -3.560259938240051e-05, -2.0600855350494385e-05, -5.599111318588257e-06, 9.402632713317871e-06, 2.4404376745224e-05, 3.940612077713013e-05, 5.4407864809036255e-05, 6.940960884094238e-05, 8.441135287284851e-05, 9.941309690475464e-05, 0.00011441484093666077, 0.0001294165849685669, 0.00014441832900047302, 0.00015942007303237915, 0.00017442181706428528, 0.0001894235610961914, 0.00020442530512809753, 0.00021942704916000366, 0.0002344287931919098, 0.0002494305372238159, 0.00026443228125572205, 0.0002794340252876282, 0.0002944357693195343, 0.00030943751335144043, 0.00032443925738334656, 0.0003394410014152527, 0.0003544427454471588, 0.00036944448947906494, 0.00038444623351097107, 0.0003994479775428772, 0.0004144497215747833, 0.00042945146560668945, 0.0004444532096385956, 0.0004594549536705017, 0.00047445669770240784, 0.000489458441734314, 0.0005044601857662201, 0.0005194619297981262, 0.0005344636738300323, 0.0005494654178619385, 0.0005644671618938446, 0.0005794689059257507, 0.0005944706499576569, 0.000609472393989563, 0.0006244741380214691, 0.0006394758820533752, 0.0006544776260852814, 0.0006694793701171875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 38.0, 768.0, 183.0, 22.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43006646633148193, -0.31518658995628357, -0.200306698679924, -0.08542680740356445, 0.02945306897163391, 0.14433294534683228, 0.259212851524353, 0.374092698097229, 0.48897260427474976, 0.6038525104522705, 0.7187323570251465, 0.8336122632026672, 0.948492169380188, 1.063372015953064, 1.1782519817352295, 1.2931318283081055, 1.4080116748809814, 1.5228915214538574, 1.637771487236023, 1.752651333808899, 1.867531180381775, 1.9824111461639404, 2.0972909927368164, 2.2121708393096924, 2.3270506858825684, 2.4419305324554443, 2.5568103790283203, 2.6716904640197754, 2.7865703105926514, 2.9014501571655273, 3.0163300037384033, 3.1312098503112793, 3.2460896968841553, 3.3609695434570312, 3.4758493900299072, 3.590729236602783, 3.7056093215942383, 3.8204891681671143, 3.9353690147399902, 4.050249099731445, 4.165128707885742, 4.280008792877197, 4.394888401031494, 4.509768486022949, 4.624648094177246, 4.739528179168701, 4.854408264160156, 4.969287872314453, 5.084167957305908, 5.199048042297363, 5.31392765045166, 5.428807735443115, 5.543687343597412, 5.658567428588867, 5.773447036743164, 5.888327121734619, 6.003206729888916, 6.118086814880371, 6.232966423034668, 6.347846508026123, 6.46272611618042, 6.577606201171875, 6.692485809326172, 6.807365894317627, 6.922245979309082]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 8.0, 4.0, 10.0, 18.0, 21.0, 11.0, 17.0, 30.0, 23.0, 35.0, 35.0, 40.0, 43.0, 49.0, 36.0, 57.0, 58.0, 47.0, 60.0, 58.0, 57.0, 30.0, 27.0, 39.0, 25.0, 21.0, 19.0, 17.0, 23.0, 6.0, 12.0, 17.0, 8.0, 10.0, 6.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.5887110233306885, -2.510352373123169, -2.4319934844970703, -2.353634834289551, -2.2752761840820312, -2.1969175338745117, -2.118558883666992, -2.0401999950408936, -1.961841344833374, -1.8834826946258545, -1.8051239252090454, -1.7267651557922363, -1.6484065055847168, -1.5700478553771973, -1.4916890859603882, -1.413330316543579, -1.3349716663360596, -1.25661301612854, -1.178254246711731, -1.0998954772949219, -1.0215368270874023, -0.943178117275238, -0.8648194074630737, -0.7864606976509094, -0.7081019878387451, -0.6297432780265808, -0.5513845682144165, -0.4730258584022522, -0.3946671485900879, -0.3163084387779236, -0.23794972896575928, -0.15959101915359497, -0.08123254776000977, -0.002873837947845459, 0.07548487186431885, 0.15384358167648315, 0.23220229148864746, 0.31056100130081177, 0.3889197111129761, 0.4672784209251404, 0.5456371307373047, 0.623995840549469, 0.7023545503616333, 0.7807132601737976, 0.8590719699859619, 0.9374306797981262, 1.0157893896102905, 1.0941481590270996, 1.1725068092346191, 1.2508654594421387, 1.3292242288589478, 1.4075829982757568, 1.4859416484832764, 1.564300298690796, 1.642659068107605, 1.721017837524414, 1.7993764877319336, 1.8777351379394531, 1.9560939073562622, 2.0344526767730713, 2.112811326980591, 2.1911699771881104, 2.269528865814209, 2.3478875160217285, 2.426246166229248]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 3.0, 6.0, 5.0, 4.0, 6.0, 11.0, 6.0, 9.0, 6.0, 31.0, 122.0, 4193525.0, 256.0, 139.0, 46.0, 16.0, 7.0, 7.0, 7.0, 5.0, 11.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0254364013671875, -0.02465653419494629, -0.023876667022705078, -0.023096799850463867, -0.022316932678222656, -0.021537065505981445, -0.020757198333740234, -0.019977331161499023, -0.019197463989257812, -0.0184175968170166, -0.01763772964477539, -0.01685786247253418, -0.01607799530029297, -0.015298128128051758, -0.014518260955810547, -0.013738393783569336, -0.012958526611328125, -0.012178659439086914, -0.011398792266845703, -0.010618925094604492, -0.009839057922363281, -0.00905919075012207, -0.00827932357788086, -0.0074994564056396484, -0.0067195892333984375, -0.0059397220611572266, -0.005159854888916016, -0.004379987716674805, -0.0036001205444335938, -0.002820253372192383, -0.002040386199951172, -0.001260519027709961, -0.00048065185546875, 0.00029921531677246094, 0.0010790824890136719, 0.0018589496612548828, 0.0026388168334960938, 0.0034186840057373047, 0.004198551177978516, 0.0049784183502197266, 0.0057582855224609375, 0.0065381526947021484, 0.007318019866943359, 0.00809788703918457, 0.008877754211425781, 0.009657621383666992, 0.010437488555908203, 0.011217355728149414, 0.011997222900390625, 0.012777090072631836, 0.013556957244873047, 0.014336824417114258, 0.015116691589355469, 0.01589655876159668, 0.01667642593383789, 0.0174562931060791, 0.018236160278320312, 0.019016027450561523, 0.019795894622802734, 0.020575761795043945, 0.021355628967285156, 0.022135496139526367, 0.022915363311767578, 0.02369523048400879, 0.02447509765625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 4.0, 3.0, 11.0, 4.0, 9.0, 6.0, 7.0, 16.0, 45.0, 136.0, 246.0, 258.0, 123.0, 30.0, 7.0, 9.0, 6.0, 11.0, 6.0, 4.0, 4.0, 7.0, 3.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.171142578125, -0.16569137573242188, -0.16024017333984375, -0.15478897094726562, -0.1493377685546875, -0.14388656616210938, -0.13843536376953125, -0.13298416137695312, -0.127532958984375, -0.12208175659179688, -0.11663055419921875, -0.11117935180664062, -0.1057281494140625, -0.10027694702148438, -0.09482574462890625, -0.08937454223632812, -0.08392333984375, -0.07847213745117188, -0.07302093505859375, -0.06756973266601562, -0.0621185302734375, -0.056667327880859375, -0.05121612548828125, -0.045764923095703125, -0.040313720703125, -0.034862518310546875, -0.02941131591796875, -0.023960113525390625, -0.0185089111328125, -0.013057708740234375, -0.00760650634765625, -0.002155303955078125, 0.0032958984375, 0.008747100830078125, 0.01419830322265625, 0.019649505615234375, 0.0251007080078125, 0.030551910400390625, 0.03600311279296875, 0.041454315185546875, 0.046905517578125, 0.052356719970703125, 0.05780792236328125, 0.06325912475585938, 0.0687103271484375, 0.07416152954101562, 0.07961273193359375, 0.08506393432617188, 0.09051513671875, 0.09596633911132812, 0.10141754150390625, 0.10686874389648438, 0.1123199462890625, 0.11777114868164062, 0.12322235107421875, 0.12867355346679688, 0.134124755859375, 0.13957595825195312, 0.14502716064453125, 0.15047836303710938, 0.1559295654296875, 0.16138076782226562, 0.16683197021484375, 0.17228317260742188, 0.177734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 2.0, 18.0, 34.0, 50.0, 104.0, 137.0, 122.0, 4193404.0, 126.0, 102.0, 80.0, 56.0, 28.0, 12.0, 9.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03277587890625, -0.032003164291381836, -0.031230449676513672, -0.030457735061645508, -0.029685020446777344, -0.02891230583190918, -0.028139591217041016, -0.02736687660217285, -0.026594161987304688, -0.025821447372436523, -0.02504873275756836, -0.024276018142700195, -0.02350330352783203, -0.022730588912963867, -0.021957874298095703, -0.02118515968322754, -0.020412445068359375, -0.01963973045349121, -0.018867015838623047, -0.018094301223754883, -0.01732158660888672, -0.016548871994018555, -0.01577615737915039, -0.015003442764282227, -0.014230728149414062, -0.013458013534545898, -0.012685298919677734, -0.01191258430480957, -0.011139869689941406, -0.010367155075073242, -0.009594440460205078, -0.008821725845336914, -0.00804901123046875, -0.007276296615600586, -0.006503582000732422, -0.005730867385864258, -0.004958152770996094, -0.00418543815612793, -0.0034127235412597656, -0.0026400089263916016, -0.0018672943115234375, -0.0010945796966552734, -0.0003218650817871094, 0.0004508495330810547, 0.0012235641479492188, 0.001996278762817383, 0.002768993377685547, 0.003541707992553711, 0.004314422607421875, 0.005087137222290039, 0.005859851837158203, 0.006632566452026367, 0.007405281066894531, 0.008177995681762695, 0.00895071029663086, 0.009723424911499023, 0.010496139526367188, 0.011268854141235352, 0.012041568756103516, 0.01281428337097168, 0.013586997985839844, 0.014359712600708008, 0.015132427215576172, 0.015905141830444336, 0.0166778564453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4094.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.609325408935547e-05, 9.716860949993134e-05, 0.00021043047308921814, 0.00032369233667850494, 0.00043695420026779175, 0.0005502160638570786, 0.0006634779274463654, 0.0007767397910356522, 0.000890001654624939, 0.0010032635182142258, 0.0011165253818035126, 0.0012297872453927994, 0.0013430491089820862, 0.001456310972571373, 0.0015695728361606598, 0.0016828346997499466, 0.0017960965633392334, 0.0019093584269285202, 0.002022620290517807, 0.002135882154107094, 0.0022491440176963806, 0.0023624058812856674, 0.0024756677448749542, 0.002588929608464241, 0.002702191472053528, 0.0028154533356428146, 0.0029287151992321014, 0.0030419770628213882, 0.003155238926410675, 0.003268500789999962, 0.0033817626535892487, 0.0034950245171785355, 0.0036082863807678223, 0.003721548244357109, 0.003834810107946396, 0.003948071971535683, 0.0040613338351249695, 0.004174595698714256, 0.004287857562303543, 0.00440111942589283, 0.004514381289482117, 0.0046276431530714035, 0.00474090501666069, 0.004854166880249977, 0.004967428743839264, 0.005080690607428551, 0.0051939524710178375, 0.005307214334607124, 0.005420476198196411, 0.005533738061785698, 0.005646999925374985, 0.0057602617889642715, 0.005873523652553558, 0.005986785516142845, 0.006100047379732132, 0.006213309243321419, 0.006326571106910706, 0.006439832970499992, 0.006553094834089279, 0.006666356697678566, 0.006779618561267853, 0.00689288042485714, 0.007006142288446426, 0.007119404152035713, 0.007232666015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 993.0, 17.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028130456805229187, -0.02724401466548443, -0.02635757066309452, -0.025471128523349762, -0.024584686383605003, -0.023698244243860245, -0.022811800241470337, -0.02192535810172558, -0.02103891596198082, -0.02015247382223606, -0.019266029819846153, -0.018379587680101395, -0.017493145540356636, -0.016606703400611877, -0.01572025939822197, -0.014833817258477211, -0.013947373256087303, -0.01306093018501997, -0.012174488045275211, -0.011288044974207878, -0.01040160283446312, -0.009515159763395786, -0.008628716692328453, -0.007742274086922407, -0.006855831481516361, -0.005969388876110315, -0.005082946270704269, -0.004196503199636936, -0.0033100605942308903, -0.0024236179888248444, -0.0015371749177575111, -0.0006507323123514652, 0.00023570843040943146, 0.0011221511522307992, 0.002008593874052167, 0.0028950367122888565, 0.0037814793176949024, 0.004667921923100948, 0.0055543649941682816, 0.0064408075995743275, 0.007327250204980373, 0.008213693276047707, 0.009100135415792465, 0.009986578486859798, 0.010873021557927132, 0.01175946369767189, 0.012645906768739223, 0.013532349839806557, 0.014418791979551315, 0.015305235050618649, 0.016191678121685982, 0.01707812026143074, 0.0179645624011755, 0.018851004540920258, 0.019737448543310165, 0.020623890683054924, 0.021510332822799683, 0.02239677496254444, 0.02328321896493435, 0.024169661104679108, 0.025056103244423866, 0.025942545384168625, 0.026828989386558533, 0.02771543152630329, 0.0286018755286932]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 12.0, 18.0, 63.0, 129.0, 170.0, 201.0, 182.0, 105.0, 69.0, 24.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006092369556427002, -0.005763119086623192, -0.005433868616819382, -0.005104618147015572, -0.0047753676772117615, -0.004446117207407951, -0.004116866737604141, -0.003787616267800331, -0.003458365797996521, -0.003129115328192711, -0.0027998648583889008, -0.0024706143885850906, -0.0021413639187812805, -0.0018121134489774704, -0.0014828629791736603, -0.0011536125093698502, -0.00082436203956604, -0.0004951115697622299, -0.0001658610999584198, 0.00016338936984539032, 0.0004926398396492004, 0.0008218903094530106, 0.0011511407792568207, 0.0014803912490606308, 0.001809641718864441, 0.002138892188668251, 0.002468142658472061, 0.0027973931282758713, 0.0031266435980796814, 0.0034558940678834915, 0.0037851445376873016, 0.004114395007491112, 0.004443645477294922, 0.004772895947098732, 0.005102146416902542, 0.005431396886706352, 0.005760647356510162, 0.0060898978263139725, 0.006419148296117783, 0.006748398765921593, 0.007077649235725403, 0.007406899705529213, 0.007736150175333023, 0.008065400645136833, 0.008394651114940643, 0.008723901584744453, 0.009053152054548264, 0.009382402524352074, 0.009711652994155884, 0.010040903463959694, 0.010370153933763504, 0.010699404403567314, 0.011028654873371124, 0.011357905343174934, 0.011687155812978745, 0.012016406282782555, 0.012345656752586365, 0.012674907222390175, 0.013004157692193985, 0.013333408161997795, 0.013662658631801605, 0.013991909101605415, 0.014321159571409225, 0.014650410041213036, 0.014979660511016846]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 5.0, 5.0, 2.0, 7.0, 8.0, 6.0, 8.0, 11.0, 18.0, 23.0, 70.0, 151.0, 278.0, 552.0, 1285.0, 3845.0, 18787.0, 983238.0, 32401.0, 5063.0, 1543.0, 593.0, 267.0, 141.0, 85.0, 42.0, 29.0, 14.0, 14.0, 14.0, 6.0, 13.0, 5.0, 5.0, 3.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.65087890625, -0.63092041015625, -0.6109619140625, -0.59100341796875, -0.571044921875, -0.55108642578125, -0.5311279296875, -0.51116943359375, -0.4912109375, -0.47125244140625, -0.4512939453125, -0.43133544921875, -0.411376953125, -0.39141845703125, -0.3714599609375, -0.35150146484375, -0.33154296875, -0.31158447265625, -0.2916259765625, -0.27166748046875, -0.251708984375, -0.23175048828125, -0.2117919921875, -0.19183349609375, -0.171875, -0.15191650390625, -0.1319580078125, -0.11199951171875, -0.092041015625, -0.07208251953125, -0.0521240234375, -0.03216552734375, -0.01220703125, 0.00775146484375, 0.0277099609375, 0.04766845703125, 0.067626953125, 0.08758544921875, 0.1075439453125, 0.12750244140625, 0.1474609375, 0.16741943359375, 0.1873779296875, 0.20733642578125, 0.227294921875, 0.24725341796875, 0.2672119140625, 0.28717041015625, 0.30712890625, 0.32708740234375, 0.3470458984375, 0.36700439453125, 0.386962890625, 0.40692138671875, 0.4268798828125, 0.44683837890625, 0.466796875, 0.48675537109375, 0.5067138671875, 0.52667236328125, 0.546630859375, 0.56658935546875, 0.5865478515625, 0.60650634765625, 0.62646484375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 4.0, 3.0, 11.0, 4.0, 9.0, 6.0, 7.0, 16.0, 45.0, 136.0, 246.0, 258.0, 123.0, 30.0, 7.0, 9.0, 6.0, 11.0, 6.0, 4.0, 4.0, 7.0, 3.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.171142578125, -0.16569137573242188, -0.16024017333984375, -0.15478897094726562, -0.1493377685546875, -0.14388656616210938, -0.13843536376953125, -0.13298416137695312, -0.127532958984375, -0.12208175659179688, -0.11663055419921875, -0.11117935180664062, -0.1057281494140625, -0.10027694702148438, -0.09482574462890625, -0.08937454223632812, -0.08392333984375, -0.07847213745117188, -0.07302093505859375, -0.06756973266601562, -0.0621185302734375, -0.056667327880859375, -0.05121612548828125, -0.045764923095703125, -0.040313720703125, -0.034862518310546875, -0.02941131591796875, -0.023960113525390625, -0.0185089111328125, -0.013057708740234375, -0.00760650634765625, -0.002155303955078125, 0.0032958984375, 0.008747100830078125, 0.01419830322265625, 0.019649505615234375, 0.0251007080078125, 0.030551910400390625, 0.03600311279296875, 0.041454315185546875, 0.046905517578125, 0.052356719970703125, 0.05780792236328125, 0.06325912475585938, 0.0687103271484375, 0.07416152954101562, 0.07961273193359375, 0.08506393432617188, 0.09051513671875, 0.09596633911132812, 0.10141754150390625, 0.10686874389648438, 0.1123199462890625, 0.11777114868164062, 0.12322235107421875, 0.12867355346679688, 0.134124755859375, 0.13957595825195312, 0.14502716064453125, 0.15047836303710938, 0.1559295654296875, 0.16138076782226562, 0.16683197021484375, 0.17228317260742188, 0.177734375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 5.0, 6.0, 2.0, 0.0, 2.0, 6.0, 8.0, 6.0, 11.0, 10.0, 13.0, 12.0, 10.0, 8.0, 13.0, 20.0, 24.0, 32.0, 28.0, 46.0, 46.0, 103.0, 168.0, 325.0, 607.0, 1385.0, 14092.0, 1021219.0, 7746.0, 1293.0, 513.0, 275.0, 150.0, 52.0, 49.0, 32.0, 26.0, 25.0, 23.0, 19.0, 28.0, 21.0, 20.0, 10.0, 7.0, 13.0, 11.0, 11.0, 5.0, 8.0, 8.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.5107421875, -0.4944915771484375, -0.478240966796875, -0.4619903564453125, -0.44573974609375, -0.4294891357421875, -0.413238525390625, -0.3969879150390625, -0.3807373046875, -0.3644866943359375, -0.348236083984375, -0.3319854736328125, -0.31573486328125, -0.2994842529296875, -0.283233642578125, -0.2669830322265625, -0.250732421875, -0.2344818115234375, -0.218231201171875, -0.2019805908203125, -0.18572998046875, -0.1694793701171875, -0.153228759765625, -0.1369781494140625, -0.1207275390625, -0.1044769287109375, -0.088226318359375, -0.0719757080078125, -0.05572509765625, -0.0394744873046875, -0.023223876953125, -0.0069732666015625, 0.00927734375, 0.0255279541015625, 0.041778564453125, 0.0580291748046875, 0.07427978515625, 0.0905303955078125, 0.106781005859375, 0.1230316162109375, 0.1392822265625, 0.1555328369140625, 0.171783447265625, 0.1880340576171875, 0.20428466796875, 0.2205352783203125, 0.236785888671875, 0.2530364990234375, 0.269287109375, 0.2855377197265625, 0.301788330078125, 0.3180389404296875, 0.33428955078125, 0.3505401611328125, 0.366790771484375, 0.3830413818359375, 0.3992919921875, 0.4155426025390625, 0.431793212890625, 0.4480438232421875, 0.46429443359375, 0.4805450439453125, 0.496795654296875, 0.5130462646484375, 0.529296875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 5.0, 6.0, 2.0, 0.0, 2.0, 6.0, 8.0, 6.0, 11.0, 10.0, 13.0, 12.0, 10.0, 8.0, 14.0, 19.0, 24.0, 33.0, 27.0, 37.0, 34.0, 39.0, 26.0, 30.0, 35.0, 39.0, 32.0, 28.0, 32.0, 34.0, 42.0, 27.0, 31.0, 20.0, 34.0, 29.0, 26.0, 25.0, 23.0, 19.0, 28.0, 21.0, 20.0, 10.0, 7.0, 13.0, 12.0, 10.0, 5.0, 8.0, 8.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.358642578125, -0.34722900390625, -0.3358154296875, -0.32440185546875, -0.31298828125, -0.30157470703125, -0.2901611328125, -0.27874755859375, -0.267333984375, -0.25592041015625, -0.2445068359375, -0.23309326171875, -0.2216796875, -0.21026611328125, -0.1988525390625, -0.18743896484375, -0.176025390625, -0.16461181640625, -0.1531982421875, -0.14178466796875, -0.13037109375, -0.11895751953125, -0.1075439453125, -0.09613037109375, -0.084716796875, -0.07330322265625, -0.0618896484375, -0.05047607421875, -0.0390625, -0.02764892578125, -0.0162353515625, -0.00482177734375, 0.006591796875, 0.01800537109375, 0.0294189453125, 0.04083251953125, 0.05224609375, 0.06365966796875, 0.0750732421875, 0.08648681640625, 0.097900390625, 0.10931396484375, 0.1207275390625, 0.13214111328125, 0.1435546875, 0.15496826171875, 0.1663818359375, 0.17779541015625, 0.189208984375, 0.20062255859375, 0.2120361328125, 0.22344970703125, 0.23486328125, 0.24627685546875, 0.2576904296875, 0.26910400390625, 0.280517578125, 0.29193115234375, 0.3033447265625, 0.31475830078125, 0.326171875, 0.33758544921875, 0.3489990234375, 0.36041259765625, 0.371826171875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 11.0, 5.0, 5.0, 12.0, 18.0, 26.0, 17.0, 44.0, 72.0, 85.0, 120.0, 221.0, 395.0, 801.0, 2034.0, 6684.0, 40786.0, 947459.0, 39147.0, 6786.0, 2004.0, 821.0, 369.0, 222.0, 129.0, 88.0, 49.0, 24.0, 32.0, 17.0, 13.0, 10.0, 15.0, 8.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010496377944946289, -0.00010084640234708786, -9.672902524471283e-05, -9.26116481423378e-05, -8.849427103996277e-05, -8.437689393758774e-05, -8.025951683521271e-05, -7.614213973283768e-05, -7.202476263046265e-05, -6.790738552808762e-05, -6.379000842571259e-05, -5.9672631323337555e-05, -5.5555254220962524e-05, -5.1437877118587494e-05, -4.732050001621246e-05, -4.320312291383743e-05, -3.90857458114624e-05, -3.496836870908737e-05, -3.085099160671234e-05, -2.673361450433731e-05, -2.261623740196228e-05, -1.849886029958725e-05, -1.438148319721222e-05, -1.0264106094837189e-05, -6.146728992462158e-06, -2.0293518900871277e-06, 2.088025212287903e-06, 6.205402314662933e-06, 1.0322779417037964e-05, 1.4440156519412994e-05, 1.8557533621788025e-05, 2.2674910724163055e-05, 2.6792287826538086e-05, 3.0909664928913116e-05, 3.502704203128815e-05, 3.914441913366318e-05, 4.326179623603821e-05, 4.737917333841324e-05, 5.149655044078827e-05, 5.56139275431633e-05, 5.973130464553833e-05, 6.384868174791336e-05, 6.796605885028839e-05, 7.208343595266342e-05, 7.620081305503845e-05, 8.031819015741348e-05, 8.443556725978851e-05, 8.855294436216354e-05, 9.267032146453857e-05, 9.67876985669136e-05, 0.00010090507566928864, 0.00010502245277166367, 0.0001091398298740387, 0.00011325720697641373, 0.00011737458407878876, 0.00012149196118116379, 0.00012560933828353882, 0.00012972671538591385, 0.00013384409248828888, 0.0001379614695906639, 0.00014207884669303894, 0.00014619622379541397, 0.000150313600897789, 0.00015443097800016403, 0.00015854835510253906]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 6.0, 12.0, 13.0, 29.0, 23.0, 44.0, 58.0, 45.0, 58.0, 58.0, 83.0, 96.0, 73.0, 94.0, 48.0, 76.0, 38.0, 36.0, 42.0, 17.0, 18.0, 7.0, 10.0, 9.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.112720489501953e-06, -3.958120942115784e-06, -3.8035213947296143e-06, -3.648921847343445e-06, -3.4943222999572754e-06, -3.339722752571106e-06, -3.1851232051849365e-06, -3.030523657798767e-06, -2.8759241104125977e-06, -2.7213245630264282e-06, -2.566725015640259e-06, -2.4121254682540894e-06, -2.25752592086792e-06, -2.1029263734817505e-06, -1.948326826095581e-06, -1.7937272787094116e-06, -1.6391277313232422e-06, -1.4845281839370728e-06, -1.3299286365509033e-06, -1.1753290891647339e-06, -1.0207295417785645e-06, -8.66129994392395e-07, -7.115304470062256e-07, -5.569308996200562e-07, -4.023313522338867e-07, -2.477318048477173e-07, -9.313225746154785e-08, 6.146728992462158e-08, 2.1606683731079102e-07, 3.7066638469696045e-07, 5.252659320831299e-07, 6.798654794692993e-07, 8.344650268554688e-07, 9.890645742416382e-07, 1.1436641216278076e-06, 1.298263669013977e-06, 1.4528632164001465e-06, 1.607462763786316e-06, 1.7620623111724854e-06, 1.9166618585586548e-06, 2.0712614059448242e-06, 2.2258609533309937e-06, 2.380460500717163e-06, 2.5350600481033325e-06, 2.689659595489502e-06, 2.8442591428756714e-06, 2.998858690261841e-06, 3.1534582376480103e-06, 3.3080577850341797e-06, 3.462657332420349e-06, 3.6172568798065186e-06, 3.771856427192688e-06, 3.926455974578857e-06, 4.081055521965027e-06, 4.235655069351196e-06, 4.390254616737366e-06, 4.544854164123535e-06, 4.699453711509705e-06, 4.854053258895874e-06, 5.0086528062820435e-06, 5.163252353668213e-06, 5.317851901054382e-06, 5.472451448440552e-06, 5.627050995826721e-06, 5.781650543212891e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 7.0, 10.0, 8.0, 24.0, 28.0, 60.0, 130.0, 235.0, 1342.0, 1040754.0, 5206.0, 412.0, 142.0, 61.0, 39.0, 27.0, 13.0, 9.0, 7.0, 2.0, 5.0, 3.0, 0.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00052642822265625, -0.0005098059773445129, -0.0004931837320327759, -0.0004765614867210388, -0.00045993924140930176, -0.0004433169960975647, -0.00042669475078582764, -0.0004100725054740906, -0.0003934502601623535, -0.00037682801485061646, -0.0003602057695388794, -0.00034358352422714233, -0.0003269612789154053, -0.0003103390336036682, -0.00029371678829193115, -0.0002770945429801941, -0.00026047229766845703, -0.00024385005235671997, -0.0002272278070449829, -0.00021060556173324585, -0.0001939833164215088, -0.00017736107110977173, -0.00016073882579803467, -0.0001441165804862976, -0.00012749433517456055, -0.00011087208986282349, -9.424984455108643e-05, -7.762759923934937e-05, -6.1005353927612305e-05, -4.4383108615875244e-05, -2.7760863304138184e-05, -1.1138617992401123e-05, 5.4836273193359375e-06, 2.2105872631072998e-05, 3.872811794281006e-05, 5.535036325454712e-05, 7.197260856628418e-05, 8.859485387802124e-05, 0.0001052170991897583, 0.00012183934450149536, 0.00013846158981323242, 0.00015508383512496948, 0.00017170608043670654, 0.0001883283257484436, 0.00020495057106018066, 0.00022157281637191772, 0.00023819506168365479, 0.00025481730699539185, 0.0002714395523071289, 0.00028806179761886597, 0.00030468404293060303, 0.0003213062882423401, 0.00033792853355407715, 0.0003545507788658142, 0.00037117302417755127, 0.00038779526948928833, 0.0004044175148010254, 0.00042103976011276245, 0.0004376620054244995, 0.00045428425073623657, 0.00047090649604797363, 0.0004875287413597107, 0.0005041509866714478, 0.0005207732319831848, 0.0005373954772949219]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 7.0, 9.0, 8.0, 17.0, 19.0, 22.0, 41.0, 62.0, 118.0, 260.0, 176.0, 92.0, 49.0, 21.0, 19.0, 15.0, 13.0, 7.0, 7.0, 2.0, 5.0, 3.0, 0.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036978721618652344, -0.00035810843110084534, -0.00034642964601516724, -0.00033475086092948914, -0.00032307207584381104, -0.00031139329075813293, -0.00029971450567245483, -0.00028803572058677673, -0.00027635693550109863, -0.00026467815041542053, -0.00025299936532974243, -0.00024132058024406433, -0.00022964179515838623, -0.00021796301007270813, -0.00020628422498703003, -0.00019460543990135193, -0.00018292665481567383, -0.00017124786972999573, -0.00015956908464431763, -0.00014789029955863953, -0.00013621151447296143, -0.00012453272938728333, -0.00011285394430160522, -0.00010117515921592712, -8.949637413024902e-05, -7.781758904457092e-05, -6.613880395889282e-05, -5.446001887321472e-05, -4.278123378753662e-05, -3.110244870185852e-05, -1.942366361618042e-05, -7.74487853050232e-06, 3.933906555175781e-06, 1.5612691640853882e-05, 2.7291476726531982e-05, 3.897026181221008e-05, 5.0649046897888184e-05, 6.232783198356628e-05, 7.400661706924438e-05, 8.568540215492249e-05, 9.736418724060059e-05, 0.00010904297232627869, 0.00012072175741195679, 0.0001324005424976349, 0.000144079327583313, 0.0001557581126689911, 0.0001674368977546692, 0.0001791156828403473, 0.0001907944679260254, 0.0002024732530117035, 0.0002141520380973816, 0.0002258308231830597, 0.0002375096082687378, 0.0002491883933544159, 0.000260867178440094, 0.0002725459635257721, 0.0002842247486114502, 0.0002959035336971283, 0.0003075823187828064, 0.0003192611038684845, 0.0003309398889541626, 0.0003426186740398407, 0.0003542974591255188, 0.0003659762442111969, 0.000377655029296875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 62.0, 817.0, 116.0, 13.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.322879314422607, -6.2091569900512695, -6.095434665679932, -5.981712341308594, -5.867990016937256, -5.754267692565918, -5.640544891357422, -5.526822566986084, -5.413100242614746, -5.299377918243408, -5.18565559387207, -5.071933269500732, -4.9582109451293945, -4.844488143920898, -4.730766296386719, -4.617043495178223, -4.503321647644043, -4.389599323272705, -4.275876998901367, -4.162154674530029, -4.048432350158691, -3.9347097873687744, -3.8209874629974365, -3.7072651386260986, -3.5935425758361816, -3.4798202514648438, -3.366097927093506, -3.252375602722168, -3.138653039932251, -3.024930715560913, -2.911208391189575, -2.7974860668182373, -2.6837635040283203, -2.5700411796569824, -2.4563188552856445, -2.3425965309143066, -2.2288739681243896, -2.1151516437530518, -2.001429319381714, -1.887706995010376, -1.7739845514297485, -1.6602622270584106, -1.5465397834777832, -1.4328174591064453, -1.3190951347351074, -1.20537269115448, -1.091650366783142, -0.9779279828071594, -0.8642055988311768, -0.7504832148551941, -0.6367608308792114, -0.5230385065078735, -0.40931612253189087, -0.2955937385559082, -0.1818714141845703, -0.06814903020858765, 0.04557335376739502, 0.1592957228422165, 0.27301809191703796, 0.38674044609069824, 0.5004628300666809, 0.6141852140426636, 0.7279075384140015, 0.8416299223899841, 0.9553523063659668]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 4.0, 6.0, 14.0, 21.0, 21.0, 13.0, 29.0, 18.0, 34.0, 35.0, 49.0, 51.0, 50.0, 60.0, 55.0, 68.0, 63.0, 64.0, 56.0, 43.0, 35.0, 25.0, 36.0, 32.0, 23.0, 20.0, 12.0, 10.0, 8.0, 7.0, 5.0, 5.0, 1.0, 5.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.859506845474243, -2.778078079223633, -2.6966493129730225, -2.615220546722412, -2.5337915420532227, -2.4523627758026123, -2.370934009552002, -2.2895052433013916, -2.2080764770507812, -2.126647710800171, -2.0452189445495605, -1.9637900590896606, -1.8823612928390503, -1.80093252658844, -1.71950364112854, -1.6380748748779297, -1.5566461086273193, -1.475217342376709, -1.3937885761260986, -1.3123596906661987, -1.2309309244155884, -1.149502158164978, -1.0680732727050781, -0.9866445064544678, -0.9052157402038574, -0.8237869739532471, -0.7423581480979919, -0.6609293222427368, -0.5795005559921265, -0.4980717599391937, -0.416642963886261, -0.33521413803100586, -0.2537853717803955, -0.17235657572746277, -0.09092777967453003, -0.00949898362159729, 0.07192981243133545, 0.1533586084842682, 0.23478740453720093, 0.31621623039245605, 0.3976449966430664, 0.47907379269599915, 0.5605025887489319, 0.641931414604187, 0.7233601808547974, 0.8047889471054077, 0.8862177729606628, 0.967646598815918, 1.0490753650665283, 1.1305041313171387, 1.211932897567749, 1.293361783027649, 1.3747905492782593, 1.4562193155288696, 1.5376482009887695, 1.6190769672393799, 1.7005057334899902, 1.7819344997406006, 1.863363265991211, 1.9447921514511108, 2.0262207984924316, 2.107649803161621, 2.1890785694122314, 2.270507335662842, 2.351936101913452]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 0.0, 7.0, 6.0, 5.0, 8.0, 8.0, 4.0, 7.0, 8.0, 9.0, 9.0, 13.0, 10.0, 10.0, 16.0, 19.0, 16.0, 26.0, 42.0, 42.0, 53.0, 85.0, 198.0, 719.0, 4190936.0, 1232.0, 420.0, 122.0, 50.0, 34.0, 34.0, 25.0, 25.0, 16.0, 10.0, 11.0, 10.0, 7.0, 4.0, 4.0, 1.0, 3.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0296630859375, -0.028751373291015625, -0.02783966064453125, -0.026927947998046875, -0.0260162353515625, -0.025104522705078125, -0.02419281005859375, -0.023281097412109375, -0.022369384765625, -0.021457672119140625, -0.02054595947265625, -0.019634246826171875, -0.0187225341796875, -0.017810821533203125, -0.01689910888671875, -0.015987396240234375, -0.01507568359375, -0.014163970947265625, -0.01325225830078125, -0.012340545654296875, -0.0114288330078125, -0.010517120361328125, -0.00960540771484375, -0.008693695068359375, -0.007781982421875, -0.006870269775390625, -0.00595855712890625, -0.005046844482421875, -0.0041351318359375, -0.003223419189453125, -0.00231170654296875, -0.001399993896484375, -0.00048828125, 0.000423431396484375, 0.00133514404296875, 0.002246856689453125, 0.0031585693359375, 0.004070281982421875, 0.00498199462890625, 0.005893707275390625, 0.006805419921875, 0.007717132568359375, 0.00862884521484375, 0.009540557861328125, 0.0104522705078125, 0.011363983154296875, 0.01227569580078125, 0.013187408447265625, 0.01409912109375, 0.015010833740234375, 0.01592254638671875, 0.016834259033203125, 0.0177459716796875, 0.018657684326171875, 0.01956939697265625, 0.020481109619140625, 0.021392822265625, 0.022304534912109375, 0.02321624755859375, 0.024127960205078125, 0.0250396728515625, 0.025951385498046875, 0.02686309814453125, 0.027774810791015625, 0.0286865234375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 3.0, 8.0, 7.0, 7.0, 7.0, 10.0, 13.0, 37.0, 135.0, 224.0, 274.0, 137.0, 30.0, 7.0, 11.0, 4.0, 13.0, 6.0, 4.0, 4.0, 8.0, 2.0, 3.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.171142578125, -0.16570472717285156, -0.16026687622070312, -0.1548290252685547, -0.14939117431640625, -0.1439533233642578, -0.13851547241210938, -0.13307762145996094, -0.1276397705078125, -0.12220191955566406, -0.11676406860351562, -0.11132621765136719, -0.10588836669921875, -0.10045051574707031, -0.09501266479492188, -0.08957481384277344, -0.084136962890625, -0.07869911193847656, -0.07326126098632812, -0.06782341003417969, -0.06238555908203125, -0.05694770812988281, -0.051509857177734375, -0.04607200622558594, -0.0406341552734375, -0.03519630432128906, -0.029758453369140625, -0.024320602416992188, -0.01888275146484375, -0.013444900512695312, -0.008007049560546875, -0.0025691986083984375, 0.00286865234375, 0.008306503295898438, 0.013744354248046875, 0.019182205200195312, 0.02462005615234375, 0.030057907104492188, 0.035495758056640625, 0.04093360900878906, 0.0463714599609375, 0.05180931091308594, 0.057247161865234375, 0.06268501281738281, 0.06812286376953125, 0.07356071472167969, 0.07899856567382812, 0.08443641662597656, 0.089874267578125, 0.09531211853027344, 0.10074996948242188, 0.10618782043457031, 0.11162567138671875, 0.11706352233886719, 0.12250137329101562, 0.12793922424316406, 0.1333770751953125, 0.13881492614746094, 0.14425277709960938, 0.1496906280517578, 0.15512847900390625, 0.1605663299560547, 0.16600418090820312, 0.17144203186035156, 0.1768798828125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 12.0, 20.0, 37.0, 73.0, 77.0, 117.0, 215.0, 673.0, 4191464.0, 1007.0, 243.0, 117.0, 87.0, 60.0, 39.0, 24.0, 12.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1103515625, -0.10798311233520508, -0.10561466217041016, -0.10324621200561523, -0.10087776184082031, -0.09850931167602539, -0.09614086151123047, -0.09377241134643555, -0.09140396118164062, -0.0890355110168457, -0.08666706085205078, -0.08429861068725586, -0.08193016052246094, -0.07956171035766602, -0.0771932601928711, -0.07482481002807617, -0.07245635986328125, -0.07008790969848633, -0.0677194595336914, -0.06535100936889648, -0.06298255920410156, -0.06061410903930664, -0.05824565887451172, -0.0558772087097168, -0.053508758544921875, -0.05114030838012695, -0.04877185821533203, -0.04640340805053711, -0.04403495788574219, -0.041666507720947266, -0.039298057556152344, -0.03692960739135742, -0.0345611572265625, -0.03219270706176758, -0.029824256896972656, -0.027455806732177734, -0.025087356567382812, -0.02271890640258789, -0.02035045623779297, -0.017982006072998047, -0.015613555908203125, -0.013245105743408203, -0.010876655578613281, -0.00850820541381836, -0.0061397552490234375, -0.0037713050842285156, -0.0014028549194335938, 0.0009655952453613281, 0.00333404541015625, 0.005702495574951172, 0.008070945739746094, 0.010439395904541016, 0.012807846069335938, 0.01517629623413086, 0.01754474639892578, 0.019913196563720703, 0.022281646728515625, 0.024650096893310547, 0.02701854705810547, 0.02938699722290039, 0.03175544738769531, 0.034123897552490234, 0.036492347717285156, 0.03886079788208008, 0.041229248046875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 19.0, 4063.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007450103759765625, -0.006632745265960693, -0.005815386772155762, -0.00499802827835083, -0.0041806697845458984, -0.003363311290740967, -0.002545952796936035, -0.0017285943031311035, -0.0009112358093261719, -9.387731552124023e-05, 0.0007234811782836914, 0.001540839672088623, 0.0023581981658935547, 0.0031755566596984863, 0.003992915153503418, 0.00481027364730835, 0.005627632141113281, 0.006444990634918213, 0.0072623491287231445, 0.008079707622528076, 0.008897066116333008, 0.00971442461013794, 0.010531783103942871, 0.011349141597747803, 0.012166500091552734, 0.012983858585357666, 0.013801217079162598, 0.01461857557296753, 0.015435934066772461, 0.016253292560577393, 0.017070651054382324, 0.017888009548187256, 0.018705368041992188, 0.01952272653579712, 0.02034008502960205, 0.021157443523406982, 0.021974802017211914, 0.022792160511016846, 0.023609519004821777, 0.02442687749862671, 0.02524423599243164, 0.026061594486236572, 0.026878952980041504, 0.027696311473846436, 0.028513669967651367, 0.0293310284614563, 0.03014838695526123, 0.030965745449066162, 0.031783103942871094, 0.032600462436676025, 0.03341782093048096, 0.03423517942428589, 0.03505253791809082, 0.03586989641189575, 0.036687254905700684, 0.037504613399505615, 0.03832197189331055, 0.03913933038711548, 0.03995668888092041, 0.04077404737472534, 0.04159140586853027, 0.042408764362335205, 0.04322612285614014, 0.04404348134994507, 0.04486083984375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 26.0, 976.0, 13.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11862185597419739, -0.11552400887012482, -0.11242616176605225, -0.10932831466197968, -0.1062304675579071, -0.10313262045383453, -0.10003477334976196, -0.09693692624568939, -0.09383907914161682, -0.09074123203754425, -0.08764338493347168, -0.08454553782939911, -0.08144769072532654, -0.07834984362125397, -0.0752519965171814, -0.07215414941310883, -0.06905630230903625, -0.06595845520496368, -0.06286060810089111, -0.05976276099681854, -0.05666491389274597, -0.0535670667886734, -0.05046921968460083, -0.04737137258052826, -0.04427352547645569, -0.04117567837238312, -0.03807783126831055, -0.034979984164237976, -0.031882137060165405, -0.028784289956092834, -0.025686442852020264, -0.022588595747947693, -0.019490748643875122, -0.01639290153980255, -0.01329505443572998, -0.01019720733165741, -0.007099360227584839, -0.004001513123512268, -0.0009036660194396973, 0.0021941810846328735, 0.005292028188705444, 0.008389875292778015, 0.011487722396850586, 0.014585569500923157, 0.017683416604995728, 0.0207812637090683, 0.02387911081314087, 0.02697695791721344, 0.03007480502128601, 0.03317265212535858, 0.03627049922943115, 0.03936834633350372, 0.042466193437576294, 0.045564040541648865, 0.048661887645721436, 0.051759734749794006, 0.05485758185386658, 0.05795542895793915, 0.06105327606201172, 0.06415112316608429, 0.06724897027015686, 0.07034681737422943, 0.073444664478302, 0.07654251158237457, 0.07964035868644714]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 9.0, 5.0, 8.0, 10.0, 12.0, 17.0, 24.0, 21.0, 30.0, 32.0, 44.0, 53.0, 54.0, 49.0, 62.0, 74.0, 77.0, 71.0, 68.0, 51.0, 41.0, 42.0, 37.0, 25.0, 17.0, 16.0, 17.0, 9.0, 11.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.035218238830566406, -0.034300897270441055, -0.033383555710315704, -0.032466210424900055, -0.031548868864774704, -0.030631527304649353, -0.029714183881878853, -0.028796840459108353, -0.027879498898983, -0.02696215733885765, -0.02604481391608715, -0.02512747049331665, -0.0242101289331913, -0.02329278737306595, -0.02237544395029545, -0.021458100527524948, -0.020540758967399597, -0.019623417407274246, -0.018706073984503746, -0.017788730561733246, -0.016871389001607895, -0.015954047441482544, -0.015036704018712044, -0.014119361527264118, -0.013202019035816193, -0.012284676544368267, -0.011367334052920341, -0.010449991561472416, -0.00953264907002449, -0.008615306578576565, -0.007697964087128639, -0.006780621595680714, -0.005863279104232788, -0.0049459366127848625, -0.004028594121336937, -0.0031112516298890114, -0.002193909138441086, -0.0012765666469931602, -0.0003592241555452347, 0.0005581183359026909, 0.0014754608273506165, 0.002392803318798542, 0.0033101458102464676, 0.004227488301694393, 0.005144830793142319, 0.006062173284590244, 0.00697951577603817, 0.007896858267486095, 0.008814200758934021, 0.009731543250381947, 0.010648885741829872, 0.011566228233277798, 0.012483570724725723, 0.013400913216173649, 0.014318255707621574, 0.0152355981990695, 0.016152940690517426, 0.017070282250642776, 0.017987625673413277, 0.018904969096183777, 0.019822310656309128, 0.02073965221643448, 0.02165699563920498, 0.02257433906197548, 0.02349168062210083]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 7.0, 9.0, 12.0, 16.0, 13.0, 34.0, 37.0, 49.0, 62.0, 106.0, 182.0, 293.0, 565.0, 1089.0, 2534.0, 6822.0, 33034.0, 964555.0, 28131.0, 6295.0, 2452.0, 1010.0, 462.0, 275.0, 154.0, 79.0, 53.0, 51.0, 30.0, 30.0, 18.0, 19.0, 13.0, 9.0, 8.0, 4.0, 7.0, 7.0, 3.0, 5.0, 6.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.473876953125, -0.4588127136230469, -0.44374847412109375, -0.4286842346191406, -0.4136199951171875, -0.3985557556152344, -0.38349151611328125, -0.3684272766113281, -0.353363037109375, -0.3382987976074219, -0.32323455810546875, -0.3081703186035156, -0.2931060791015625, -0.2780418395996094, -0.26297760009765625, -0.24791336059570312, -0.23284912109375, -0.21778488159179688, -0.20272064208984375, -0.18765640258789062, -0.1725921630859375, -0.15752792358398438, -0.14246368408203125, -0.12739944458007812, -0.112335205078125, -0.09727096557617188, -0.08220672607421875, -0.06714248657226562, -0.0520782470703125, -0.037014007568359375, -0.02194976806640625, -0.006885528564453125, 0.0081787109375, 0.023242950439453125, 0.03830718994140625, 0.053371429443359375, 0.0684356689453125, 0.08349990844726562, 0.09856414794921875, 0.11362838745117188, 0.128692626953125, 0.14375686645507812, 0.15882110595703125, 0.17388534545898438, 0.1889495849609375, 0.20401382446289062, 0.21907806396484375, 0.23414230346679688, 0.24920654296875, 0.2642707824707031, 0.27933502197265625, 0.2943992614746094, 0.3094635009765625, 0.3245277404785156, 0.33959197998046875, 0.3546562194824219, 0.369720458984375, 0.3847846984863281, 0.39984893798828125, 0.4149131774902344, 0.4299774169921875, 0.4450416564941406, 0.46010589599609375, 0.4751701354980469, 0.490234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 3.0, 8.0, 7.0, 7.0, 7.0, 10.0, 13.0, 36.0, 137.0, 223.0, 273.0, 138.0, 30.0, 7.0, 11.0, 4.0, 13.0, 6.0, 4.0, 4.0, 8.0, 2.0, 3.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.171142578125, -0.16570472717285156, -0.16026687622070312, -0.1548290252685547, -0.14939117431640625, -0.1439533233642578, -0.13851547241210938, -0.13307762145996094, -0.1276397705078125, -0.12220191955566406, -0.11676406860351562, -0.11132621765136719, -0.10588836669921875, -0.10045051574707031, -0.09501266479492188, -0.08957481384277344, -0.084136962890625, -0.07869911193847656, -0.07326126098632812, -0.06782341003417969, -0.06238555908203125, -0.05694770812988281, -0.051509857177734375, -0.04607200622558594, -0.0406341552734375, -0.03519630432128906, -0.029758453369140625, -0.024320602416992188, -0.01888275146484375, -0.013444900512695312, -0.008007049560546875, -0.0025691986083984375, 0.00286865234375, 0.008306503295898438, 0.013744354248046875, 0.019182205200195312, 0.02462005615234375, 0.030057907104492188, 0.035495758056640625, 0.04093360900878906, 0.0463714599609375, 0.05180931091308594, 0.057247161865234375, 0.06268501281738281, 0.06812286376953125, 0.07356071472167969, 0.07899856567382812, 0.08443641662597656, 0.089874267578125, 0.09531211853027344, 0.10074996948242188, 0.10618782043457031, 0.11162567138671875, 0.11706352233886719, 0.12250137329101562, 0.12793922424316406, 0.1333770751953125, 0.13881492614746094, 0.14425277709960938, 0.1496906280517578, 0.15512847900390625, 0.1605663299560547, 0.16600418090820312, 0.17144203186035156, 0.1768798828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 5.0, 6.0, 3.0, 5.0, 11.0, 8.0, 9.0, 9.0, 8.0, 12.0, 17.0, 24.0, 21.0, 29.0, 31.0, 40.0, 54.0, 67.0, 117.0, 213.0, 441.0, 1141.0, 6866.0, 1021444.0, 15328.0, 1376.0, 534.0, 233.0, 131.0, 77.0, 46.0, 30.0, 26.0, 24.0, 22.0, 25.0, 16.0, 16.0, 21.0, 6.0, 14.0, 9.0, 5.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.611328125, -0.5925750732421875, -0.573822021484375, -0.5550689697265625, -0.53631591796875, -0.5175628662109375, -0.498809814453125, -0.4800567626953125, -0.4613037109375, -0.4425506591796875, -0.423797607421875, -0.4050445556640625, -0.38629150390625, -0.3675384521484375, -0.348785400390625, -0.3300323486328125, -0.311279296875, -0.2925262451171875, -0.273773193359375, -0.2550201416015625, -0.23626708984375, -0.2175140380859375, -0.198760986328125, -0.1800079345703125, -0.1612548828125, -0.1425018310546875, -0.123748779296875, -0.1049957275390625, -0.08624267578125, -0.0674896240234375, -0.048736572265625, -0.0299835205078125, -0.01123046875, 0.0075225830078125, 0.026275634765625, 0.0450286865234375, 0.06378173828125, 0.0825347900390625, 0.101287841796875, 0.1200408935546875, 0.1387939453125, 0.1575469970703125, 0.176300048828125, 0.1950531005859375, 0.21380615234375, 0.2325592041015625, 0.251312255859375, 0.2700653076171875, 0.288818359375, 0.3075714111328125, 0.326324462890625, 0.3450775146484375, 0.36383056640625, 0.3825836181640625, 0.401336669921875, 0.4200897216796875, 0.4388427734375, 0.4575958251953125, 0.476348876953125, 0.4951019287109375, 0.51385498046875, 0.5326080322265625, 0.551361083984375, 0.5701141357421875, 0.5888671875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 5.0, 7.0, 2.0, 5.0, 11.0, 8.0, 9.0, 9.0, 10.0, 11.0, 16.0, 24.0, 22.0, 29.0, 32.0, 35.0, 42.0, 28.0, 26.0, 38.0, 46.0, 39.0, 31.0, 38.0, 32.0, 27.0, 36.0, 40.0, 39.0, 31.0, 31.0, 25.0, 26.0, 24.0, 22.0, 25.0, 16.0, 16.0, 21.0, 6.0, 14.0, 9.0, 5.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.359619140625, -0.3485832214355469, -0.33754730224609375, -0.3265113830566406, -0.3154754638671875, -0.3044395446777344, -0.29340362548828125, -0.2823677062988281, -0.271331787109375, -0.2602958679199219, -0.24925994873046875, -0.23822402954101562, -0.2271881103515625, -0.21615219116210938, -0.20511627197265625, -0.19408035278320312, -0.18304443359375, -0.17200851440429688, -0.16097259521484375, -0.14993667602539062, -0.1389007568359375, -0.12786483764648438, -0.11682891845703125, -0.10579299926757812, -0.094757080078125, -0.08372116088867188, -0.07268524169921875, -0.061649322509765625, -0.0506134033203125, -0.039577484130859375, -0.02854156494140625, -0.017505645751953125, -0.0064697265625, 0.004566192626953125, 0.01560211181640625, 0.026638031005859375, 0.0376739501953125, 0.048709869384765625, 0.05974578857421875, 0.07078170776367188, 0.081817626953125, 0.09285354614257812, 0.10388946533203125, 0.11492538452148438, 0.1259613037109375, 0.13699722290039062, 0.14803314208984375, 0.15906906127929688, 0.17010498046875, 0.18114089965820312, 0.19217681884765625, 0.20321273803710938, 0.2142486572265625, 0.22528457641601562, 0.23632049560546875, 0.24735641479492188, 0.258392333984375, 0.2694282531738281, 0.28046417236328125, 0.2915000915527344, 0.3025360107421875, 0.3135719299316406, 0.32460784912109375, 0.3356437683105469, 0.3466796875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 7.0, 9.0, 9.0, 13.0, 16.0, 23.0, 39.0, 70.0, 108.0, 168.0, 369.0, 794.0, 2580.0, 12393.0, 944692.0, 78277.0, 6125.0, 1636.0, 538.0, 290.0, 128.0, 85.0, 64.0, 39.0, 23.0, 14.0, 11.0, 7.0, 7.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029206275939941406, -0.0002825818955898285, -0.0002731010317802429, -0.00026362016797065735, -0.0002541393041610718, -0.0002446584403514862, -0.00023517757654190063, -0.00022569671273231506, -0.0002162158489227295, -0.00020673498511314392, -0.00019725412130355835, -0.00018777325749397278, -0.0001782923936843872, -0.00016881152987480164, -0.00015933066606521606, -0.0001498498022556305, -0.00014036893844604492, -0.00013088807463645935, -0.00012140721082687378, -0.00011192634701728821, -0.00010244548320770264, -9.296461939811707e-05, -8.34837555885315e-05, -7.400289177894592e-05, -6.452202796936035e-05, -5.504116415977478e-05, -4.556030035018921e-05, -3.607943654060364e-05, -2.6598572731018066e-05, -1.7117708921432495e-05, -7.636845111846924e-06, 1.8440186977386475e-06, 1.1324882507324219e-05, 2.080574631690979e-05, 3.028661012649536e-05, 3.976747393608093e-05, 4.9248337745666504e-05, 5.8729201555252075e-05, 6.821006536483765e-05, 7.769092917442322e-05, 8.717179298400879e-05, 9.665265679359436e-05, 0.00010613352060317993, 0.0001156143844127655, 0.00012509524822235107, 0.00013457611203193665, 0.00014405697584152222, 0.0001535378396511078, 0.00016301870346069336, 0.00017249956727027893, 0.0001819804310798645, 0.00019146129488945007, 0.00020094215869903564, 0.00021042302250862122, 0.0002199038863182068, 0.00022938475012779236, 0.00023886561393737793, 0.0002483464777469635, 0.00025782734155654907, 0.00026730820536613464, 0.0002767890691757202, 0.0002862699329853058, 0.00029575079679489136, 0.00030523166060447693, 0.0003147125244140625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 3.0, 1.0, 6.0, 9.0, 15.0, 17.0, 16.0, 19.0, 32.0, 39.0, 47.0, 32.0, 85.0, 86.0, 88.0, 91.0, 82.0, 67.0, 73.0, 55.0, 31.0, 30.0, 15.0, 12.0, 13.0, 16.0, 9.0, 4.0, 5.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.020069122314453e-06, -5.846843123435974e-06, -5.673617124557495e-06, -5.500391125679016e-06, -5.327165126800537e-06, -5.153939127922058e-06, -4.980713129043579e-06, -4.8074871301651e-06, -4.634261131286621e-06, -4.461035132408142e-06, -4.287809133529663e-06, -4.114583134651184e-06, -3.941357135772705e-06, -3.768131136894226e-06, -3.594905138015747e-06, -3.421679139137268e-06, -3.248453140258789e-06, -3.07522714138031e-06, -2.902001142501831e-06, -2.728775143623352e-06, -2.555549144744873e-06, -2.382323145866394e-06, -2.209097146987915e-06, -2.035871148109436e-06, -1.862645149230957e-06, -1.689419150352478e-06, -1.516193151473999e-06, -1.34296715259552e-06, -1.169741153717041e-06, -9.96515154838562e-07, -8.23289155960083e-07, -6.50063157081604e-07, -4.76837158203125e-07, -3.03611159324646e-07, -1.30385160446167e-07, 4.284083843231201e-08, 2.1606683731079102e-07, 3.8929283618927e-07, 5.62518835067749e-07, 7.35744833946228e-07, 9.08970832824707e-07, 1.082196831703186e-06, 1.255422830581665e-06, 1.428648829460144e-06, 1.601874828338623e-06, 1.775100827217102e-06, 1.948326826095581e-06, 2.12155282497406e-06, 2.294778823852539e-06, 2.468004822731018e-06, 2.641230821609497e-06, 2.814456820487976e-06, 2.987682819366455e-06, 3.160908818244934e-06, 3.334134817123413e-06, 3.507360816001892e-06, 3.680586814880371e-06, 3.85381281375885e-06, 4.027038812637329e-06, 4.200264811515808e-06, 4.373490810394287e-06, 4.546716809272766e-06, 4.719942808151245e-06, 4.893168807029724e-06, 5.066394805908203e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 3.0, 6.0, 9.0, 10.0, 7.0, 5.0, 14.0, 17.0, 23.0, 47.0, 90.0, 241.0, 726.0, 240868.0, 805285.0, 769.0, 205.0, 92.0, 40.0, 21.0, 20.0, 13.0, 13.0, 9.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007300376892089844, -0.0007072314620018005, -0.0006844252347946167, -0.0006616190075874329, -0.000638812780380249, -0.0006160065531730652, -0.0005932003259658813, -0.0005703940987586975, -0.0005475878715515137, -0.0005247816443443298, -0.000501975417137146, -0.00047916918992996216, -0.0004563629627227783, -0.0004335567355155945, -0.00041075050830841064, -0.0003879442811012268, -0.00036513805389404297, -0.00034233182668685913, -0.0003195255994796753, -0.00029671937227249146, -0.0002739131450653076, -0.0002511069178581238, -0.00022830069065093994, -0.0002054944634437561, -0.00018268823623657227, -0.00015988200902938843, -0.0001370757818222046, -0.00011426955461502075, -9.146332740783691e-05, -6.865710020065308e-05, -4.585087299346924e-05, -2.30446457862854e-05, -2.384185791015625e-07, 2.2567808628082275e-05, 4.537403583526611e-05, 6.818026304244995e-05, 9.098649024963379e-05, 0.00011379271745681763, 0.00013659894466400146, 0.0001594051718711853, 0.00018221139907836914, 0.00020501762628555298, 0.00022782385349273682, 0.00025063008069992065, 0.0002734363079071045, 0.00029624253511428833, 0.00031904876232147217, 0.000341854989528656, 0.00036466121673583984, 0.0003874674439430237, 0.0004102736711502075, 0.00043307989835739136, 0.0004558861255645752, 0.00047869235277175903, 0.0005014985799789429, 0.0005243048071861267, 0.0005471110343933105, 0.0005699172616004944, 0.0005927234888076782, 0.0006155297160148621, 0.0006383359432220459, 0.0006611421704292297, 0.0006839483976364136, 0.0007067546248435974, 0.0007295608520507812]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 3.0, 6.0, 10.0, 9.0, 7.0, 5.0, 12.0, 14.0, 15.0, 25.0, 33.0, 74.0, 110.0, 180.0, 167.0, 118.0, 64.0, 43.0, 22.0, 16.0, 15.0, 11.0, 13.0, 9.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043010711669921875, -0.0004166699945926666, -0.0004032328724861145, -0.0003897957503795624, -0.00037635862827301025, -0.00036292150616645813, -0.000349484384059906, -0.0003360472619533539, -0.00032261013984680176, -0.00030917301774024963, -0.0002957358956336975, -0.0002822987735271454, -0.00026886165142059326, -0.00025542452931404114, -0.00024198740720748901, -0.0002285502851009369, -0.00021511316299438477, -0.00020167604088783264, -0.00018823891878128052, -0.0001748017966747284, -0.00016136467456817627, -0.00014792755246162415, -0.00013449043035507202, -0.0001210533082485199, -0.00010761618614196777, -9.417906403541565e-05, -8.074194192886353e-05, -6.73048198223114e-05, -5.386769771575928e-05, -4.043057560920715e-05, -2.699345350265503e-05, -1.3556331396102905e-05, -1.1920928955078125e-07, 1.3317912817001343e-05, 2.6755034923553467e-05, 4.019215703010559e-05, 5.3629279136657715e-05, 6.706640124320984e-05, 8.050352334976196e-05, 9.394064545631409e-05, 0.00010737776756286621, 0.00012081488966941833, 0.00013425201177597046, 0.00014768913388252258, 0.0001611262559890747, 0.00017456337809562683, 0.00018800050020217896, 0.00020143762230873108, 0.0002148747444152832, 0.00022831186652183533, 0.00024174898862838745, 0.0002551861107349396, 0.0002686232328414917, 0.0002820603549480438, 0.00029549747705459595, 0.00030893459916114807, 0.0003223717212677002, 0.0003358088433742523, 0.00034924596548080444, 0.00036268308758735657, 0.0003761202096939087, 0.0003895573318004608, 0.00040299445390701294, 0.00041643157601356506, 0.0004298686981201172]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0, 770.0, 197.0, 20.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5866167545318604, -2.467851161956787, -2.349085569381714, -2.2303199768066406, -2.1115543842315674, -1.9927887916564941, -1.8740230798721313, -1.755257487297058, -1.6364918947219849, -1.5177263021469116, -1.3989607095718384, -1.2801949977874756, -1.1614294052124023, -1.042663812637329, -0.9238982200622559, -0.8051326274871826, -0.6863670349121094, -0.5676014423370361, -0.4488358199596405, -0.3300701975822449, -0.21130460500717163, -0.09253901243209839, 0.02622663974761963, 0.14499223232269287, 0.2637578248977661, 0.38252341747283936, 0.5012890100479126, 0.6200546622276306, 0.7388202548027039, 0.8575858473777771, 0.9763514995574951, 1.0951170921325684, 1.2138824462890625, 1.3326480388641357, 1.451413631439209, 1.5701792240142822, 1.6889448165893555, 1.8077104091644287, 1.9264761209487915, 2.0452418327331543, 2.1640071868896484, 2.2827727794647217, 2.401538372039795, 2.520303964614868, 2.6390695571899414, 2.7578351497650146, 2.876600742340088, 2.9953665733337402, 3.1141321659088135, 3.2328977584838867, 3.35166335105896, 3.470428943634033, 3.5891945362091064, 3.7079601287841797, 3.826725959777832, 3.945491313934326, 4.0642571449279785, 4.183022975921631, 4.301788330078125, 4.420554161071777, 4.5393195152282715, 4.658085346221924, 4.776850700378418, 4.89561653137207, 5.0143818855285645]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 6.0, 5.0, 10.0, 9.0, 5.0, 8.0, 19.0, 8.0, 12.0, 17.0, 18.0, 25.0, 25.0, 23.0, 32.0, 34.0, 43.0, 57.0, 31.0, 53.0, 54.0, 49.0, 46.0, 50.0, 39.0, 49.0, 31.0, 35.0, 35.0, 29.0, 25.0, 24.0, 25.0, 12.0, 14.0, 16.0, 6.0, 5.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.911253571510315, -1.8514207601547241, -1.7915879487991333, -1.7317551374435425, -1.6719223260879517, -1.6120895147323608, -1.5522565841674805, -1.4924237728118896, -1.4325909614562988, -1.372758150100708, -1.3129253387451172, -1.2530925273895264, -1.1932597160339355, -1.1334269046783447, -1.073594093322754, -1.013761281967163, -0.9539284706115723, -0.8940956592559814, -0.8342628479003906, -0.7744300365447998, -0.714597225189209, -0.6547644138336182, -0.5949315428733826, -0.5350987315177917, -0.4752659201622009, -0.4154331088066101, -0.3556002974510193, -0.2957674562931061, -0.23593464493751526, -0.17610183358192444, -0.11626899242401123, -0.05643618106842041, 0.003396749496459961, 0.06322956830263138, 0.1230623871088028, 0.1828952133655548, 0.24272802472114563, 0.30256083607673645, 0.36239367723464966, 0.4222264885902405, 0.4820592999458313, 0.5418921113014221, 0.6017249226570129, 0.6615577936172485, 0.7213906049728394, 0.7812234163284302, 0.841056227684021, 0.9008890390396118, 0.9607218503952026, 1.0205546617507935, 1.0803874731063843, 1.140220284461975, 1.200053095817566, 1.2598859071731567, 1.319718837738037, 1.379551649093628, 1.4393844604492188, 1.4992172718048096, 1.5590500831604004, 1.6188828945159912, 1.678715705871582, 1.7385485172271729, 1.7983813285827637, 1.8582141399383545, 1.9180469512939453]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 3.0, 6.0, 3.0, 13.0, 4.0, 12.0, 16.0, 19.0, 29.0, 33.0, 56.0, 63.0, 88.0, 109.0, 173.0, 350.0, 1057.0, 4393.0, 4181834.0, 3655.0, 962.0, 399.0, 245.0, 167.0, 120.0, 85.0, 68.0, 53.0, 48.0, 35.0, 22.0, 19.0, 19.0, 10.0, 22.0, 10.0, 12.0, 16.0, 9.0, 8.0, 7.0, 9.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.49609375, -2.41693115234375, -2.3377685546875, -2.25860595703125, -2.179443359375, -2.10028076171875, -2.0211181640625, -1.94195556640625, -1.86279296875, -1.78363037109375, -1.7044677734375, -1.62530517578125, -1.546142578125, -1.46697998046875, -1.3878173828125, -1.30865478515625, -1.2294921875, -1.15032958984375, -1.0711669921875, -0.99200439453125, -0.912841796875, -0.83367919921875, -0.7545166015625, -0.67535400390625, -0.59619140625, -0.51702880859375, -0.4378662109375, -0.35870361328125, -0.279541015625, -0.20037841796875, -0.1212158203125, -0.04205322265625, 0.037109375, 0.11627197265625, 0.1954345703125, 0.27459716796875, 0.353759765625, 0.43292236328125, 0.5120849609375, 0.59124755859375, 0.67041015625, 0.74957275390625, 0.8287353515625, 0.90789794921875, 0.987060546875, 1.06622314453125, 1.1453857421875, 1.22454833984375, 1.3037109375, 1.38287353515625, 1.4620361328125, 1.54119873046875, 1.620361328125, 1.69952392578125, 1.7786865234375, 1.85784912109375, 1.93701171875, 2.01617431640625, 2.0953369140625, 2.17449951171875, 2.253662109375, 2.33282470703125, 2.4119873046875, 2.49114990234375, 2.5703125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 3.0, 4.0, 6.0, 9.0, 7.0, 7.0, 8.0, 15.0, 34.0, 127.0, 221.0, 271.0, 146.0, 38.0, 9.0, 6.0, 10.0, 10.0, 6.0, 3.0, 6.0, 7.0, 2.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1710205078125, -0.16559410095214844, -0.16016769409179688, -0.1547412872314453, -0.14931488037109375, -0.1438884735107422, -0.13846206665039062, -0.13303565979003906, -0.1276092529296875, -0.12218284606933594, -0.11675643920898438, -0.11133003234863281, -0.10590362548828125, -0.10047721862792969, -0.09505081176757812, -0.08962440490722656, -0.084197998046875, -0.07877159118652344, -0.07334518432617188, -0.06791877746582031, -0.06249237060546875, -0.05706596374511719, -0.051639556884765625, -0.04621315002441406, -0.0407867431640625, -0.03536033630371094, -0.029933929443359375, -0.024507522583007812, -0.01908111572265625, -0.013654708862304688, -0.008228302001953125, -0.0028018951416015625, 0.00262451171875, 0.008050918579101562, 0.013477325439453125, 0.018903732299804688, 0.02433013916015625, 0.029756546020507812, 0.035182952880859375, 0.04060935974121094, 0.0460357666015625, 0.05146217346191406, 0.056888580322265625, 0.06231498718261719, 0.06774139404296875, 0.07316780090332031, 0.07859420776367188, 0.08402061462402344, 0.089447021484375, 0.09487342834472656, 0.10029983520507812, 0.10572624206542969, 0.11115264892578125, 0.11657905578613281, 0.12200546264648438, 0.12743186950683594, 0.1328582763671875, 0.13828468322753906, 0.14371109008789062, 0.1491374969482422, 0.15456390380859375, 0.1599903106689453, 0.16541671752929688, 0.17084312438964844, 0.17626953125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 6.0, 7.0, 12.0, 12.0, 12.0, 10.0, 14.0, 15.0, 33.0, 39.0, 39.0, 68.0, 129.0, 384.0, 3704.0, 4150448.0, 37567.0, 1243.0, 209.0, 106.0, 56.0, 41.0, 27.0, 12.0, 14.0, 20.0, 11.0, 12.0, 6.0, 5.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.791015625, -0.7661361694335938, -0.7412567138671875, -0.7163772583007812, -0.691497802734375, -0.6666183471679688, -0.6417388916015625, -0.6168594360351562, -0.59197998046875, -0.5671005249023438, -0.5422210693359375, -0.5173416137695312, -0.492462158203125, -0.46758270263671875, -0.4427032470703125, -0.41782379150390625, -0.3929443359375, -0.36806488037109375, -0.3431854248046875, -0.31830596923828125, -0.293426513671875, -0.26854705810546875, -0.2436676025390625, -0.21878814697265625, -0.19390869140625, -0.16902923583984375, -0.1441497802734375, -0.11927032470703125, -0.094390869140625, -0.06951141357421875, -0.0446319580078125, -0.01975250244140625, 0.005126953125, 0.03000640869140625, 0.0548858642578125, 0.07976531982421875, 0.104644775390625, 0.12952423095703125, 0.1544036865234375, 0.17928314208984375, 0.20416259765625, 0.22904205322265625, 0.2539215087890625, 0.27880096435546875, 0.303680419921875, 0.32855987548828125, 0.3534393310546875, 0.37831878662109375, 0.4031982421875, 0.42807769775390625, 0.4529571533203125, 0.47783660888671875, 0.502716064453125, 0.5275955200195312, 0.5524749755859375, 0.5773544311523438, 0.60223388671875, 0.6271133422851562, 0.6519927978515625, 0.6768722534179688, 0.701751708984375, 0.7266311645507812, 0.7515106201171875, 0.7763900756835938, 0.80126953125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 5.0, 2.0, 3.0, 8.0, 9.0, 16.0, 24.0, 48.0, 130.0, 922.0, 2444.0, 269.0, 85.0, 29.0, 12.0, 10.0, 15.0, 9.0, 6.0, 0.0, 3.0, 3.0, 6.0, 3.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31396484375, -0.3042144775390625, -0.294464111328125, -0.2847137451171875, -0.27496337890625, -0.2652130126953125, -0.255462646484375, -0.2457122802734375, -0.2359619140625, -0.2262115478515625, -0.216461181640625, -0.2067108154296875, -0.19696044921875, -0.1872100830078125, -0.177459716796875, -0.1677093505859375, -0.157958984375, -0.1482086181640625, -0.138458251953125, -0.1287078857421875, -0.11895751953125, -0.1092071533203125, -0.099456787109375, -0.0897064208984375, -0.0799560546875, -0.0702056884765625, -0.060455322265625, -0.0507049560546875, -0.04095458984375, -0.0312042236328125, -0.021453857421875, -0.0117034912109375, -0.001953125, 0.0077972412109375, 0.017547607421875, 0.0272979736328125, 0.03704833984375, 0.0467987060546875, 0.056549072265625, 0.0662994384765625, 0.0760498046875, 0.0858001708984375, 0.095550537109375, 0.1053009033203125, 0.11505126953125, 0.1248016357421875, 0.134552001953125, 0.1443023681640625, 0.154052734375, 0.1638031005859375, 0.173553466796875, 0.1833038330078125, 0.19305419921875, 0.2028045654296875, 0.212554931640625, 0.2223052978515625, 0.2320556640625, 0.2418060302734375, 0.251556396484375, 0.2613067626953125, 0.27105712890625, 0.2808074951171875, 0.290557861328125, 0.3003082275390625, 0.31005859375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 14.0, 886.0, 113.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.184982776641846, -4.079996585845947, -3.975010633468628, -3.8700246810913086, -3.76503849029541, -3.6600522994995117, -3.5550663471221924, -3.450080394744873, -3.3450942039489746, -3.240108013153076, -3.135122060775757, -3.0301361083984375, -2.925149917602539, -2.8201637268066406, -2.7151777744293213, -2.610191822052002, -2.5052056312561035, -2.400219440460205, -2.2952334880828857, -2.1902475357055664, -2.085261344909668, -1.980275273323059, -1.8752892017364502, -1.7703031301498413, -1.6653170585632324, -1.5603309869766235, -1.4553449153900146, -1.3503588438034058, -1.2453727722167969, -1.140386700630188, -1.035400629043579, -0.9304145574569702, -0.8254287242889404, -0.7204426527023315, -0.6154565811157227, -0.5104705095291138, -0.4054844379425049, -0.300498366355896, -0.1955122947692871, -0.09052622318267822, 0.014459848403930664, 0.11944591999053955, 0.22443199157714844, 0.3294180631637573, 0.4344041347503662, 0.5393902063369751, 0.644376277923584, 0.7493623495101929, 0.8543484210968018, 0.9593344926834106, 1.0643205642700195, 1.1693066358566284, 1.2742927074432373, 1.3792787790298462, 1.484264850616455, 1.589250922203064, 1.6942369937896729, 1.7992230653762817, 1.9042091369628906, 2.009195327758789, 2.1141812801361084, 2.2191672325134277, 2.324153423309326, 2.4291396141052246, 2.534125566482544]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 12.0, 2.0, 10.0, 17.0, 13.0, 13.0, 17.0, 21.0, 11.0, 27.0, 42.0, 23.0, 31.0, 40.0, 36.0, 42.0, 53.0, 46.0, 38.0, 41.0, 43.0, 56.0, 44.0, 30.0, 41.0, 31.0, 23.0, 22.0, 26.0, 27.0, 19.0, 14.0, 14.0, 8.0, 15.0, 8.0, 10.0, 7.0, 4.0, 4.0, 2.0, 1.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0], "bins": [-0.746130108833313, -0.7244852781295776, -0.7028404474258423, -0.6811956167221069, -0.6595507860183716, -0.6379059553146362, -0.6162611246109009, -0.5946162939071655, -0.5729714632034302, -0.5513266324996948, -0.5296818017959595, -0.5080369710922241, -0.48639214038848877, -0.4647473096847534, -0.4431024491786957, -0.4214576184749603, -0.3998127579689026, -0.37816792726516724, -0.3565230965614319, -0.33487826585769653, -0.3132334351539612, -0.29158860445022583, -0.2699437439441681, -0.24829891324043274, -0.2266540825366974, -0.20500925183296204, -0.18336442112922668, -0.16171957552433014, -0.1400747448205948, -0.11842991411685944, -0.09678506851196289, -0.07514023780822754, -0.05349540710449219, -0.03185057267546654, -0.010205738246440887, 0.011439099907875061, 0.03308393061161041, 0.054728761315345764, 0.07637360692024231, 0.09801843762397766, 0.11966326832771301, 0.14130809903144836, 0.16295292973518372, 0.18459777534008026, 0.2062426060438156, 0.22788743674755096, 0.2495322823524475, 0.27117711305618286, 0.2928219437599182, 0.31446677446365356, 0.3361116051673889, 0.35775643587112427, 0.3794012665748596, 0.40104609727859497, 0.4226909577846527, 0.44433578848838806, 0.4659806191921234, 0.48762544989585876, 0.5092703104019165, 0.5309151411056519, 0.5525599718093872, 0.5742048025131226, 0.5958496332168579, 0.6174944639205933, 0.6391392946243286]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 5.0, 6.0, 8.0, 8.0, 10.0, 12.0, 16.0, 14.0, 30.0, 39.0, 58.0, 65.0, 79.0, 110.0, 166.0, 201.0, 259.0, 375.0, 528.0, 776.0, 1146.0, 1895.0, 3396.0, 7758.0, 39162.0, 944858.0, 31613.0, 7047.0, 3164.0, 1787.0, 1066.0, 735.0, 528.0, 413.0, 312.0, 216.0, 181.0, 139.0, 108.0, 71.0, 48.0, 41.0, 28.0, 20.0, 16.0, 15.0, 7.0, 7.0, 3.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.0576171875, -1.0250396728515625, -0.992462158203125, -0.9598846435546875, -0.92730712890625, -0.8947296142578125, -0.862152099609375, -0.8295745849609375, -0.7969970703125, -0.7644195556640625, -0.731842041015625, -0.6992645263671875, -0.66668701171875, -0.6341094970703125, -0.601531982421875, -0.5689544677734375, -0.536376953125, -0.5037994384765625, -0.471221923828125, -0.4386444091796875, -0.40606689453125, -0.3734893798828125, -0.340911865234375, -0.3083343505859375, -0.2757568359375, -0.2431793212890625, -0.210601806640625, -0.1780242919921875, -0.14544677734375, -0.1128692626953125, -0.080291748046875, -0.0477142333984375, -0.01513671875, 0.0174407958984375, 0.050018310546875, 0.0825958251953125, 0.11517333984375, 0.1477508544921875, 0.180328369140625, 0.2129058837890625, 0.2454833984375, 0.2780609130859375, 0.310638427734375, 0.3432159423828125, 0.37579345703125, 0.4083709716796875, 0.440948486328125, 0.4735260009765625, 0.506103515625, 0.5386810302734375, 0.571258544921875, 0.6038360595703125, 0.63641357421875, 0.6689910888671875, 0.701568603515625, 0.7341461181640625, 0.7667236328125, 0.7993011474609375, 0.831878662109375, 0.8644561767578125, 0.89703369140625, 0.9296112060546875, 0.962188720703125, 0.9947662353515625, 1.02734375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 3.0, 4.0, 6.0, 9.0, 7.0, 7.0, 8.0, 15.0, 34.0, 125.0, 220.0, 276.0, 143.0, 36.0, 13.0, 4.0, 10.0, 11.0, 6.0, 3.0, 6.0, 7.0, 2.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1710205078125, -0.16559600830078125, -0.1601715087890625, -0.15474700927734375, -0.149322509765625, -0.14389801025390625, -0.1384735107421875, -0.13304901123046875, -0.12762451171875, -0.12220001220703125, -0.1167755126953125, -0.11135101318359375, -0.105926513671875, -0.10050201416015625, -0.0950775146484375, -0.08965301513671875, -0.084228515625, -0.07880401611328125, -0.0733795166015625, -0.06795501708984375, -0.062530517578125, -0.05710601806640625, -0.0516815185546875, -0.04625701904296875, -0.04083251953125, -0.03540802001953125, -0.0299835205078125, -0.02455902099609375, -0.019134521484375, -0.01371002197265625, -0.0082855224609375, -0.00286102294921875, 0.0025634765625, 0.00798797607421875, 0.0134124755859375, 0.01883697509765625, 0.024261474609375, 0.02968597412109375, 0.0351104736328125, 0.04053497314453125, 0.04595947265625, 0.05138397216796875, 0.0568084716796875, 0.06223297119140625, 0.067657470703125, 0.07308197021484375, 0.0785064697265625, 0.08393096923828125, 0.08935546875, 0.09477996826171875, 0.1002044677734375, 0.10562896728515625, 0.111053466796875, 0.11647796630859375, 0.1219024658203125, 0.12732696533203125, 0.13275146484375, 0.13817596435546875, 0.1436004638671875, 0.14902496337890625, 0.154449462890625, 0.15987396240234375, 0.1652984619140625, 0.17072296142578125, 0.1761474609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 1.0, 7.0, 12.0, 10.0, 27.0, 34.0, 45.0, 58.0, 58.0, 110.0, 158.0, 161.0, 245.0, 468.0, 1015.0, 10465.0, 1028717.0, 4773.0, 902.0, 399.0, 232.0, 167.0, 122.0, 101.0, 74.0, 60.0, 47.0, 27.0, 12.0, 19.0, 6.0, 11.0, 7.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.076171875, -1.0369110107421875, -0.997650146484375, -0.9583892822265625, -0.91912841796875, -0.8798675537109375, -0.840606689453125, -0.8013458251953125, -0.7620849609375, -0.7228240966796875, -0.683563232421875, -0.6443023681640625, -0.60504150390625, -0.5657806396484375, -0.526519775390625, -0.4872589111328125, -0.447998046875, -0.4087371826171875, -0.369476318359375, -0.3302154541015625, -0.29095458984375, -0.2516937255859375, -0.212432861328125, -0.1731719970703125, -0.1339111328125, -0.0946502685546875, -0.055389404296875, -0.0161285400390625, 0.02313232421875, 0.0623931884765625, 0.101654052734375, 0.1409149169921875, 0.18017578125, 0.2194366455078125, 0.258697509765625, 0.2979583740234375, 0.33721923828125, 0.3764801025390625, 0.415740966796875, 0.4550018310546875, 0.4942626953125, 0.5335235595703125, 0.572784423828125, 0.6120452880859375, 0.65130615234375, 0.6905670166015625, 0.729827880859375, 0.7690887451171875, 0.808349609375, 0.8476104736328125, 0.886871337890625, 0.9261322021484375, 0.96539306640625, 1.0046539306640625, 1.043914794921875, 1.0831756591796875, 1.1224365234375, 1.1616973876953125, 1.200958251953125, 1.2402191162109375, 1.27947998046875, 1.3187408447265625, 1.358001708984375, 1.3972625732421875, 1.4365234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 0.0, 5.0, 9.0, 8.0, 11.0, 13.0, 20.0, 26.0, 29.0, 16.0, 37.0, 45.0, 34.0, 43.0, 49.0, 51.0, 45.0, 64.0, 46.0, 38.0, 51.0, 51.0, 42.0, 36.0, 41.0, 31.0, 41.0, 28.0, 28.0, 15.0, 13.0, 13.0, 6.0, 3.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36328125, -0.34812164306640625, -0.3329620361328125, -0.31780242919921875, -0.302642822265625, -0.28748321533203125, -0.2723236083984375, -0.25716400146484375, -0.24200439453125, -0.22684478759765625, -0.2116851806640625, -0.19652557373046875, -0.181365966796875, -0.16620635986328125, -0.1510467529296875, -0.13588714599609375, -0.1207275390625, -0.10556793212890625, -0.0904083251953125, -0.07524871826171875, -0.060089111328125, -0.04492950439453125, -0.0297698974609375, -0.01461029052734375, 0.00054931640625, 0.01570892333984375, 0.0308685302734375, 0.04602813720703125, 0.061187744140625, 0.07634735107421875, 0.0915069580078125, 0.10666656494140625, 0.121826171875, 0.13698577880859375, 0.1521453857421875, 0.16730499267578125, 0.182464599609375, 0.19762420654296875, 0.2127838134765625, 0.22794342041015625, 0.24310302734375, 0.25826263427734375, 0.2734222412109375, 0.28858184814453125, 0.303741455078125, 0.31890106201171875, 0.3340606689453125, 0.34922027587890625, 0.3643798828125, 0.37953948974609375, 0.3946990966796875, 0.40985870361328125, 0.425018310546875, 0.44017791748046875, 0.4553375244140625, 0.47049713134765625, 0.48565673828125, 0.5008163452148438, 0.5159759521484375, 0.5311355590820312, 0.546295166015625, 0.5614547729492188, 0.5766143798828125, 0.5917739868164062, 0.60693359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 5.0, 12.0, 12.0, 19.0, 40.0, 63.0, 101.0, 182.0, 401.0, 1146.0, 4836.0, 108104.0, 924523.0, 6760.0, 1390.0, 461.0, 213.0, 114.0, 52.0, 40.0, 21.0, 13.0, 7.0, 14.0, 4.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001850128173828125, -0.0017942041158676147, -0.0017382800579071045, -0.0016823559999465942, -0.001626431941986084, -0.0015705078840255737, -0.0015145838260650635, -0.0014586597681045532, -0.001402735710144043, -0.0013468116521835327, -0.0012908875942230225, -0.0012349635362625122, -0.001179039478302002, -0.0011231154203414917, -0.0010671913623809814, -0.0010112673044204712, -0.0009553432464599609, -0.0008994191884994507, -0.0008434951305389404, -0.0007875710725784302, -0.0007316470146179199, -0.0006757229566574097, -0.0006197988986968994, -0.0005638748407363892, -0.0005079507827758789, -0.00045202672481536865, -0.0003961026668548584, -0.00034017860889434814, -0.0002842545509338379, -0.00022833049297332764, -0.00017240643501281738, -0.00011648237705230713, -6.0558319091796875e-05, -4.634261131286621e-06, 5.128979682922363e-05, 0.00010721385478973389, 0.00016313791275024414, 0.0002190619707107544, 0.00027498602867126465, 0.0003309100866317749, 0.00038683414459228516, 0.0004427582025527954, 0.0004986822605133057, 0.0005546063184738159, 0.0006105303764343262, 0.0006664544343948364, 0.0007223784923553467, 0.0007783025503158569, 0.0008342266082763672, 0.0008901506662368774, 0.0009460747241973877, 0.001001998782157898, 0.0010579228401184082, 0.0011138468980789185, 0.0011697709560394287, 0.001225695013999939, 0.0012816190719604492, 0.0013375431299209595, 0.0013934671878814697, 0.00144939124584198, 0.0015053153038024902, 0.0015612393617630005, 0.0016171634197235107, 0.001673087477684021, 0.0017290115356445312]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 6.0, 2.0, 5.0, 7.0, 5.0, 7.0, 11.0, 14.0, 13.0, 19.0, 26.0, 37.0, 42.0, 42.0, 54.0, 64.0, 76.0, 58.0, 75.0, 69.0, 65.0, 56.0, 39.0, 51.0, 33.0, 28.0, 17.0, 19.0, 14.0, 7.0, 13.0, 5.0, 4.0, 6.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4373016357421875e-06, -6.205402314662933e-06, -5.973502993583679e-06, -5.741603672504425e-06, -5.509704351425171e-06, -5.277805030345917e-06, -5.045905709266663e-06, -4.8140063881874084e-06, -4.582107067108154e-06, -4.3502077460289e-06, -4.118308424949646e-06, -3.886409103870392e-06, -3.6545097827911377e-06, -3.4226104617118835e-06, -3.1907111406326294e-06, -2.9588118195533752e-06, -2.726912498474121e-06, -2.495013177394867e-06, -2.263113856315613e-06, -2.0312145352363586e-06, -1.7993152141571045e-06, -1.5674158930778503e-06, -1.3355165719985962e-06, -1.103617250919342e-06, -8.717179298400879e-07, -6.398186087608337e-07, -4.079192876815796e-07, -1.7601996660232544e-07, 5.587935447692871e-08, 2.8777867555618286e-07, 5.19677996635437e-07, 7.515773177146912e-07, 9.834766387939453e-07, 1.2153759598731995e-06, 1.4472752809524536e-06, 1.6791746020317078e-06, 1.911073923110962e-06, 2.142973244190216e-06, 2.3748725652694702e-06, 2.6067718863487244e-06, 2.8386712074279785e-06, 3.0705705285072327e-06, 3.302469849586487e-06, 3.534369170665741e-06, 3.766268491744995e-06, 3.998167812824249e-06, 4.230067133903503e-06, 4.4619664549827576e-06, 4.693865776062012e-06, 4.925765097141266e-06, 5.15766441822052e-06, 5.389563739299774e-06, 5.621463060379028e-06, 5.8533623814582825e-06, 6.085261702537537e-06, 6.317161023616791e-06, 6.549060344696045e-06, 6.780959665775299e-06, 7.012858986854553e-06, 7.244758307933807e-06, 7.4766576290130615e-06, 7.708556950092316e-06, 7.94045627117157e-06, 8.172355592250824e-06, 8.404254913330078e-06]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 1.0, 6.0, 4.0, 12.0, 7.0, 11.0, 16.0, 23.0, 34.0, 47.0, 78.0, 132.0, 230.0, 713.0, 23355.0, 1021809.0, 1291.0, 334.0, 155.0, 77.0, 67.0, 39.0, 27.0, 20.0, 19.0, 8.0, 3.0, 8.0, 6.0, 3.0, 8.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0019178390502929688, -0.0018542557954788208, -0.0017906725406646729, -0.001727089285850525, -0.001663506031036377, -0.001599922776222229, -0.001536339521408081, -0.001472756266593933, -0.0014091730117797852, -0.0013455897569656372, -0.0012820065021514893, -0.0012184232473373413, -0.0011548399925231934, -0.0010912567377090454, -0.0010276734828948975, -0.0009640902280807495, -0.0009005069732666016, -0.0008369237184524536, -0.0007733404636383057, -0.0007097572088241577, -0.0006461739540100098, -0.0005825906991958618, -0.0005190074443817139, -0.0004554241895675659, -0.00039184093475341797, -0.00032825767993927, -0.00026467442512512207, -0.00020109117031097412, -0.00013750791549682617, -7.392466068267822e-05, -1.0341405868530273e-05, 5.3241848945617676e-05, 0.00011682510375976562, 0.00018040835857391357, 0.00024399161338806152, 0.00030757486820220947, 0.0003711581230163574, 0.00043474137783050537, 0.0004983246326446533, 0.0005619078874588013, 0.0006254911422729492, 0.0006890743970870972, 0.0007526576519012451, 0.0008162409067153931, 0.000879824161529541, 0.000943407416343689, 0.001006990671157837, 0.0010705739259719849, 0.0011341571807861328, 0.0011977404356002808, 0.0012613236904144287, 0.0013249069452285767, 0.0013884902000427246, 0.0014520734548568726, 0.0015156567096710205, 0.0015792399644851685, 0.0016428232192993164, 0.0017064064741134644, 0.0017699897289276123, 0.0018335729837417603, 0.0018971562385559082, 0.001960739493370056, 0.002024322748184204, 0.002087906002998352, 0.0021514892578125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 5.0, 1.0, 6.0, 4.0, 4.0, 7.0, 8.0, 14.0, 11.0, 20.0, 35.0, 46.0, 87.0, 163.0, 286.0, 107.0, 47.0, 42.0, 24.0, 25.0, 15.0, 14.0, 12.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008106231689453125, -0.0007837414741516113, -0.0007568597793579102, -0.000729978084564209, -0.0007030963897705078, -0.0006762146949768066, -0.0006493330001831055, -0.0006224513053894043, -0.0005955696105957031, -0.000568687915802002, -0.0005418062210083008, -0.0005149245262145996, -0.00048804283142089844, -0.00046116113662719727, -0.0004342794418334961, -0.0004073977470397949, -0.00038051605224609375, -0.0003536343574523926, -0.0003267526626586914, -0.00029987096786499023, -0.00027298927307128906, -0.0002461075782775879, -0.00021922588348388672, -0.00019234418869018555, -0.00016546249389648438, -0.0001385807991027832, -0.00011169910430908203, -8.481740951538086e-05, -5.793571472167969e-05, -3.1054019927978516e-05, -4.172325134277344e-06, 2.2709369659423828e-05, 4.9591064453125e-05, 7.647275924682617e-05, 0.00010335445404052734, 0.00013023614883422852, 0.0001571178436279297, 0.00018399953842163086, 0.00021088123321533203, 0.0002377629280090332, 0.0002646446228027344, 0.00029152631759643555, 0.0003184080123901367, 0.0003452897071838379, 0.00037217140197753906, 0.00039905309677124023, 0.0004259347915649414, 0.0004528164863586426, 0.00047969818115234375, 0.0005065798759460449, 0.0005334615707397461, 0.0005603432655334473, 0.0005872249603271484, 0.0006141066551208496, 0.0006409883499145508, 0.000667870044708252, 0.0006947517395019531, 0.0007216334342956543, 0.0007485151290893555, 0.0007753968238830566, 0.0008022785186767578, 0.000829160213470459, 0.0008560419082641602, 0.0008829236030578613, 0.0009098052978515625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [23.0, 974.0, 18.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4046477973461151, -0.1024133563041687, 0.1998210847377777, 0.5020555257797241, 0.8042899370193481, 1.1065243482589722, 1.4087588787078857, 1.7109932899475098, 2.013227701187134, 2.315462112426758, 2.617696523666382, 2.919930934906006, 3.222165584564209, 3.524399757385254, 3.826634407043457, 4.12886905670166, 4.431103229522705, 4.733337879180908, 5.035572052001953, 5.337806701660156, 5.640040874481201, 5.942275524139404, 6.244509696960449, 6.546744346618652, 6.8489789962768555, 7.151213645935059, 7.4534478187561035, 7.755682468414307, 8.057916641235352, 8.360151290893555, 8.662385940551758, 8.964620590209961, 9.266854286193848, 9.56908893585205, 9.871323585510254, 10.17355728149414, 10.475791931152344, 10.778026580810547, 11.08026123046875, 11.382495880126953, 11.68472957611084, 11.986964225769043, 12.289198875427246, 12.591432571411133, 12.893667221069336, 13.195901870727539, 13.498136520385742, 13.800371170043945, 14.102605819702148, 14.404840469360352, 14.707075119018555, 15.009308815002441, 15.311543464660645, 15.613778114318848, 15.91601276397705, 16.218246459960938, 16.52048110961914, 16.822715759277344, 17.124950408935547, 17.42718505859375, 17.729419708251953, 18.031652450561523, 18.333887100219727, 18.63612174987793, 18.938356399536133]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 4.0, 8.0, 9.0, 8.0, 20.0, 16.0, 15.0, 22.0, 22.0, 36.0, 28.0, 40.0, 39.0, 45.0, 46.0, 66.0, 65.0, 44.0, 55.0, 58.0, 41.0, 43.0, 41.0, 35.0, 25.0, 25.0, 28.0, 20.0, 25.0, 13.0, 10.0, 7.0, 5.0, 8.0, 7.0, 7.0, 3.0, 4.0, 1.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9260327816009521, -1.868394136428833, -1.8107556104660034, -1.7531169652938843, -1.6954784393310547, -1.6378397941589355, -1.5802011489868164, -1.5225626230239868, -1.4649239778518677, -1.4072853326797485, -1.349646806716919, -1.2920081615447998, -1.2343696355819702, -1.176730990409851, -1.1190924644470215, -1.0614538192749023, -1.0038151741027832, -0.9461765885353088, -0.8885380029678345, -0.8308993577957153, -0.773260772228241, -0.7156221866607666, -0.6579836010932922, -0.6003450155258179, -0.5427064895629883, -0.4850679039955139, -0.42742928862571716, -0.3697907030582428, -0.31215208768844604, -0.2545135021209717, -0.19687491655349731, -0.13923630118370056, -0.08159768581390381, -0.023959089070558548, 0.03367950767278671, 0.09131810069084167, 0.14895670115947723, 0.2065953016281128, 0.26423388719558716, 0.3218725025653839, 0.3795110881328583, 0.43714967370033264, 0.4947882890701294, 0.5524268746376038, 0.6100654602050781, 0.6677041053771973, 0.7253426313400269, 0.782981276512146, 0.8406198620796204, 0.8982584476470947, 0.9558970332145691, 1.0135356187820435, 1.0711742639541626, 1.1288127899169922, 1.1864514350891113, 1.2440900802612305, 1.30172860622406, 1.3593672513961792, 1.4170057773590088, 1.474644422531128, 1.5322829484939575, 1.5899215936660767, 1.6475601196289062, 1.7051987648010254, 1.7628374099731445]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 4.0, 10.0, 5.0, 5.0, 11.0, 20.0, 16.0, 17.0, 25.0, 36.0, 74.0, 199.0, 820.0, 4191019.0, 1552.0, 183.0, 50.0, 39.0, 28.0, 24.0, 18.0, 16.0, 21.0, 12.0, 8.0, 6.0, 9.0, 7.0, 8.0, 5.0, 6.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.15625, -51.4765625, -49.796875, -48.1171875, -46.4375, -44.7578125, -43.078125, -41.3984375, -39.71875, -38.0390625, -36.359375, -34.6796875, -33.0, -31.3203125, -29.640625, -27.9609375, -26.28125, -24.6015625, -22.921875, -21.2421875, -19.5625, -17.8828125, -16.203125, -14.5234375, -12.84375, -11.1640625, -9.484375, -7.8046875, -6.125, -4.4453125, -2.765625, -1.0859375, 0.59375, 2.2734375, 3.953125, 5.6328125, 7.3125, 8.9921875, 10.671875, 12.3515625, 14.03125, 15.7109375, 17.390625, 19.0703125, 20.75, 22.4296875, 24.109375, 25.7890625, 27.46875, 29.1484375, 30.828125, 32.5078125, 34.1875, 35.8671875, 37.546875, 39.2265625, 40.90625, 42.5859375, 44.265625, 45.9453125, 47.625, 49.3046875, 50.984375, 52.6640625, 54.34375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 2.0, 5.0, 12.0, 7.0, 6.0, 7.0, 16.0, 29.0, 112.0, 209.0, 286.0, 152.0, 46.0, 11.0, 8.0, 8.0, 11.0, 7.0, 3.0, 6.0, 7.0, 2.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.16537857055664062, -0.15998077392578125, -0.15458297729492188, -0.1491851806640625, -0.14378738403320312, -0.13838958740234375, -0.13299179077148438, -0.127593994140625, -0.12219619750976562, -0.11679840087890625, -0.11140060424804688, -0.1060028076171875, -0.10060501098632812, -0.09520721435546875, -0.08980941772460938, -0.08441162109375, -0.07901382446289062, -0.07361602783203125, -0.06821823120117188, -0.0628204345703125, -0.057422637939453125, -0.05202484130859375, -0.046627044677734375, -0.041229248046875, -0.035831451416015625, -0.03043365478515625, -0.025035858154296875, -0.0196380615234375, -0.014240264892578125, -0.00884246826171875, -0.003444671630859375, 0.001953125, 0.007350921630859375, 0.01274871826171875, 0.018146514892578125, 0.0235443115234375, 0.028942108154296875, 0.03433990478515625, 0.039737701416015625, 0.045135498046875, 0.050533294677734375, 0.05593109130859375, 0.061328887939453125, 0.0667266845703125, 0.07212448120117188, 0.07752227783203125, 0.08292007446289062, 0.08831787109375, 0.09371566772460938, 0.09911346435546875, 0.10451126098632812, 0.1099090576171875, 0.11530685424804688, 0.12070465087890625, 0.12610244750976562, 0.131500244140625, 0.13689804077148438, 0.14229583740234375, 0.14769363403320312, 0.1530914306640625, 0.15848922729492188, 0.16388702392578125, 0.16928482055664062, 0.1746826171875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 7.0, 17.0, 16.0, 28.0, 34.0, 63.0, 100.0, 195.0, 368.0, 746.0, 1999.0, 6770.0, 4040195.0, 133880.0, 6338.0, 1981.0, 752.0, 344.0, 170.0, 97.0, 52.0, 40.0, 20.0, 16.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3525390625, -1.311492919921875, -1.27044677734375, -1.229400634765625, -1.1883544921875, -1.147308349609375, -1.10626220703125, -1.065216064453125, -1.024169921875, -0.983123779296875, -0.94207763671875, -0.901031494140625, -0.8599853515625, -0.818939208984375, -0.77789306640625, -0.736846923828125, -0.69580078125, -0.654754638671875, -0.61370849609375, -0.572662353515625, -0.5316162109375, -0.490570068359375, -0.44952392578125, -0.408477783203125, -0.367431640625, -0.326385498046875, -0.28533935546875, -0.244293212890625, -0.2032470703125, -0.162200927734375, -0.12115478515625, -0.080108642578125, -0.0390625, 0.001983642578125, 0.04302978515625, 0.084075927734375, 0.1251220703125, 0.166168212890625, 0.20721435546875, 0.248260498046875, 0.289306640625, 0.330352783203125, 0.37139892578125, 0.412445068359375, 0.4534912109375, 0.494537353515625, 0.53558349609375, 0.576629638671875, 0.61767578125, 0.658721923828125, 0.69976806640625, 0.740814208984375, 0.7818603515625, 0.822906494140625, 0.86395263671875, 0.904998779296875, 0.946044921875, 0.987091064453125, 1.02813720703125, 1.069183349609375, 1.1102294921875, 1.151275634765625, 1.19232177734375, 1.233367919921875, 1.2744140625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 8.0, 12.0, 37.0, 86.0, 3620.0, 187.0, 39.0, 14.0, 6.0, 4.0, 5.0, 6.0, 8.0, 4.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26708984375, -0.2574424743652344, -0.24779510498046875, -0.23814773559570312, -0.2285003662109375, -0.21885299682617188, -0.20920562744140625, -0.19955825805664062, -0.189910888671875, -0.18026351928710938, -0.17061614990234375, -0.16096878051757812, -0.1513214111328125, -0.14167404174804688, -0.13202667236328125, -0.12237930297851562, -0.11273193359375, -0.10308456420898438, -0.09343719482421875, -0.08378982543945312, -0.0741424560546875, -0.06449508666992188, -0.05484771728515625, -0.045200347900390625, -0.035552978515625, -0.025905609130859375, -0.01625823974609375, -0.006610870361328125, 0.0030364990234375, 0.012683868408203125, 0.02233123779296875, 0.031978607177734375, 0.0416259765625, 0.051273345947265625, 0.06092071533203125, 0.07056808471679688, 0.0802154541015625, 0.08986282348632812, 0.09951019287109375, 0.10915756225585938, 0.118804931640625, 0.12845230102539062, 0.13809967041015625, 0.14774703979492188, 0.1573944091796875, 0.16704177856445312, 0.17668914794921875, 0.18633651733398438, 0.19598388671875, 0.20563125610351562, 0.21527862548828125, 0.22492599487304688, 0.2345733642578125, 0.24422073364257812, 0.25386810302734375, 0.2635154724121094, 0.273162841796875, 0.2828102111816406, 0.29245758056640625, 0.3021049499511719, 0.3117523193359375, 0.3213996887207031, 0.33104705810546875, 0.3406944274902344, 0.350341796875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 11.0, 16.0, 19.0, 49.0, 125.0, 774.0, 10.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.145597457885742, -26.68362045288086, -26.22164535522461, -25.759668350219727, -25.297691345214844, -24.83571434020996, -24.37373924255371, -23.911762237548828, -23.449785232543945, -22.987808227539062, -22.525833129882812, -22.06385612487793, -21.601879119873047, -21.139902114868164, -20.677927017211914, -20.21595001220703, -19.75397491455078, -19.2919979095459, -18.83002281188965, -18.368045806884766, -17.906068801879883, -17.444091796875, -16.98211669921875, -16.520139694213867, -16.058162689208984, -15.596186637878418, -15.134209632873535, -14.672233581542969, -14.210256576538086, -13.74828052520752, -13.286304473876953, -12.82432746887207, -12.362349510192871, -11.900373458862305, -11.438396453857422, -10.976420402526855, -10.514443397521973, -10.052467346191406, -9.590490341186523, -9.128514289855957, -8.66653823852539, -8.204562187194824, -7.742585182189941, -7.280609130859375, -6.818632125854492, -6.356656074523926, -5.894679546356201, -5.432703018188477, -4.970726013183594, -4.508749485015869, -4.0467729568481445, -3.584796667098999, -3.1228201389312744, -2.66084361076355, -2.1988673210144043, -1.7368907928466797, -1.274914264678955, -0.8129377961158752, -0.3509613275527954, 0.11101508140563965, 0.5729916095733643, 1.0349681377410889, 1.4969444274902344, 1.958920955657959, 2.4208974838256836]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 3.0, 6.0, 8.0, 11.0, 14.0, 25.0, 22.0, 36.0, 53.0, 48.0, 68.0, 81.0, 84.0, 100.0, 87.0, 74.0, 56.0, 51.0, 36.0, 29.0, 17.0, 22.0, 18.0, 16.0, 12.0, 6.0, 7.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0666534900665283, -1.9883503913879395, -1.9100474119186401, -1.8317443132400513, -1.7534412145614624, -1.675138235092163, -1.5968351364135742, -1.5185320377349854, -1.4402289390563965, -1.3619258403778076, -1.2836228609085083, -1.2053197622299194, -1.1270166635513306, -1.0487136840820312, -0.9704105854034424, -0.8921074867248535, -0.8138045072555542, -0.7355014681816101, -0.6571983695030212, -0.5788953304290771, -0.5005922317504883, -0.4222891926765442, -0.3439861536026001, -0.26568305492401123, -0.18738001585006714, -0.10907695442438126, -0.030773892998695374, 0.04752916097640991, 0.1258322298526764, 0.20413529872894287, 0.28243833780288696, 0.36074143648147583, 0.4390444755554199, 0.517347514629364, 0.5956506133079529, 0.673953652381897, 0.7522567510604858, 0.8305597901344299, 0.908862829208374, 0.9871659278869629, 1.0654690265655518, 1.1437721252441406, 1.22207510471344, 1.3003782033920288, 1.3786813020706177, 1.456984281539917, 1.5352873802185059, 1.6135904788970947, 1.691893458366394, 1.770196557044983, 1.8484995365142822, 1.926802635192871, 2.00510573387146, 2.083408832550049, 2.1617116928100586, 2.2400150299072266, 2.3183178901672363, 2.396620988845825, 2.474924087524414, 2.553226947784424, 2.6315300464630127, 2.7098331451416016, 2.7881362438201904, 2.8664393424987793, 2.944742441177368]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 7.0, 9.0, 19.0, 34.0, 44.0, 67.0, 78.0, 138.0, 186.0, 274.0, 437.0, 787.0, 1407.0, 2899.0, 7423.0, 31859.0, 952385.0, 35723.0, 7804.0, 3115.0, 1592.0, 897.0, 494.0, 287.0, 157.0, 108.0, 85.0, 51.0, 44.0, 26.0, 24.0, 12.0, 17.0, 8.0, 12.0, 5.0, 7.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1689453125, -1.131866455078125, -1.09478759765625, -1.057708740234375, -1.0206298828125, -0.983551025390625, -0.94647216796875, -0.909393310546875, -0.872314453125, -0.835235595703125, -0.79815673828125, -0.761077880859375, -0.7239990234375, -0.686920166015625, -0.64984130859375, -0.612762451171875, -0.57568359375, -0.538604736328125, -0.50152587890625, -0.464447021484375, -0.4273681640625, -0.390289306640625, -0.35321044921875, -0.316131591796875, -0.279052734375, -0.241973876953125, -0.20489501953125, -0.167816162109375, -0.1307373046875, -0.093658447265625, -0.05657958984375, -0.019500732421875, 0.017578125, 0.054656982421875, 0.09173583984375, 0.128814697265625, 0.1658935546875, 0.202972412109375, 0.24005126953125, 0.277130126953125, 0.314208984375, 0.351287841796875, 0.38836669921875, 0.425445556640625, 0.4625244140625, 0.499603271484375, 0.53668212890625, 0.573760986328125, 0.61083984375, 0.647918701171875, 0.68499755859375, 0.722076416015625, 0.7591552734375, 0.796234130859375, 0.83331298828125, 0.870391845703125, 0.907470703125, 0.944549560546875, 0.98162841796875, 1.018707275390625, 1.0557861328125, 1.092864990234375, 1.12994384765625, 1.167022705078125, 1.2041015625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 6.0, 2.0, 10.0, 6.0, 12.0, 6.0, 6.0, 14.0, 46.0, 121.0, 217.0, 243.0, 138.0, 60.0, 17.0, 7.0, 7.0, 10.0, 8.0, 1.0, 9.0, 7.0, 4.0, 2.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.17138671875, -0.1659564971923828, -0.16052627563476562, -0.15509605407714844, -0.14966583251953125, -0.14423561096191406, -0.13880538940429688, -0.1333751678466797, -0.1279449462890625, -0.12251472473144531, -0.11708450317382812, -0.11165428161621094, -0.10622406005859375, -0.10079383850097656, -0.09536361694335938, -0.08993339538574219, -0.084503173828125, -0.07907295227050781, -0.07364273071289062, -0.06821250915527344, -0.06278228759765625, -0.05735206604003906, -0.051921844482421875, -0.04649162292480469, -0.0410614013671875, -0.03563117980957031, -0.030200958251953125, -0.024770736694335938, -0.01934051513671875, -0.013910293579101562, -0.008480072021484375, -0.0030498504638671875, 0.00238037109375, 0.0078105926513671875, 0.013240814208984375, 0.018671035766601562, 0.02410125732421875, 0.029531478881835938, 0.034961700439453125, 0.04039192199707031, 0.0458221435546875, 0.05125236511230469, 0.056682586669921875, 0.06211280822753906, 0.06754302978515625, 0.07297325134277344, 0.07840347290039062, 0.08383369445800781, 0.089263916015625, 0.09469413757324219, 0.10012435913085938, 0.10555458068847656, 0.11098480224609375, 0.11641502380371094, 0.12184524536132812, 0.1272754669189453, 0.1327056884765625, 0.1381359100341797, 0.14356613159179688, 0.14899635314941406, 0.15442657470703125, 0.15985679626464844, 0.16528701782226562, 0.1707172393798828, 0.1761474609375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 6.0, 17.0, 10.0, 13.0, 13.0, 22.0, 30.0, 48.0, 67.0, 84.0, 109.0, 161.0, 266.0, 372.0, 641.0, 1134.0, 2264.0, 5576.0, 16758.0, 71960.0, 776058.0, 133967.0, 24816.0, 7611.0, 2968.0, 1435.0, 768.0, 442.0, 277.0, 172.0, 141.0, 108.0, 63.0, 34.0, 30.0, 31.0, 22.0, 17.0, 10.0, 3.0, 3.0, 9.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60791015625, -0.5874099731445312, -0.5669097900390625, -0.5464096069335938, -0.525909423828125, -0.5054092407226562, -0.4849090576171875, -0.46440887451171875, -0.44390869140625, -0.42340850830078125, -0.4029083251953125, -0.38240814208984375, -0.361907958984375, -0.34140777587890625, -0.3209075927734375, -0.30040740966796875, -0.2799072265625, -0.25940704345703125, -0.2389068603515625, -0.21840667724609375, -0.197906494140625, -0.17740631103515625, -0.1569061279296875, -0.13640594482421875, -0.11590576171875, -0.09540557861328125, -0.0749053955078125, -0.05440521240234375, -0.033905029296875, -0.01340484619140625, 0.0070953369140625, 0.02759552001953125, 0.048095703125, 0.06859588623046875, 0.0890960693359375, 0.10959625244140625, 0.130096435546875, 0.15059661865234375, 0.1710968017578125, 0.19159698486328125, 0.21209716796875, 0.23259735107421875, 0.2530975341796875, 0.27359771728515625, 0.294097900390625, 0.31459808349609375, 0.3350982666015625, 0.35559844970703125, 0.3760986328125, 0.39659881591796875, 0.4170989990234375, 0.43759918212890625, 0.458099365234375, 0.47859954833984375, 0.4990997314453125, 0.5195999145507812, 0.54010009765625, 0.5606002807617188, 0.5811004638671875, 0.6016006469726562, 0.622100830078125, 0.6426010131835938, 0.6631011962890625, 0.6836013793945312, 0.7041015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 8.0, 4.0, 5.0, 10.0, 11.0, 13.0, 14.0, 22.0, 29.0, 27.0, 21.0, 34.0, 29.0, 32.0, 41.0, 36.0, 37.0, 54.0, 49.0, 46.0, 45.0, 53.0, 40.0, 40.0, 47.0, 39.0, 30.0, 38.0, 24.0, 18.0, 22.0, 21.0, 9.0, 16.0, 7.0, 9.0, 5.0, 2.0, 2.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.386474609375, -0.3737983703613281, -0.36112213134765625, -0.3484458923339844, -0.3357696533203125, -0.3230934143066406, -0.31041717529296875, -0.2977409362792969, -0.285064697265625, -0.2723884582519531, -0.25971221923828125, -0.24703598022460938, -0.2343597412109375, -0.22168350219726562, -0.20900726318359375, -0.19633102416992188, -0.18365478515625, -0.17097854614257812, -0.15830230712890625, -0.14562606811523438, -0.1329498291015625, -0.12027359008789062, -0.10759735107421875, -0.09492111206054688, -0.082244873046875, -0.06956863403320312, -0.05689239501953125, -0.044216156005859375, -0.0315399169921875, -0.018863677978515625, -0.00618743896484375, 0.006488800048828125, 0.0191650390625, 0.031841278076171875, 0.04451751708984375, 0.057193756103515625, 0.0698699951171875, 0.08254623413085938, 0.09522247314453125, 0.10789871215820312, 0.120574951171875, 0.13325119018554688, 0.14592742919921875, 0.15860366821289062, 0.1712799072265625, 0.18395614624023438, 0.19663238525390625, 0.20930862426757812, 0.22198486328125, 0.23466110229492188, 0.24733734130859375, 0.2600135803222656, 0.2726898193359375, 0.2853660583496094, 0.29804229736328125, 0.3107185363769531, 0.323394775390625, 0.3360710144042969, 0.34874725341796875, 0.3614234924316406, 0.3740997314453125, 0.3867759704589844, 0.39945220947265625, 0.4121284484863281, 0.4248046875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 5.0, 8.0, 20.0, 26.0, 48.0, 83.0, 125.0, 194.0, 369.0, 704.0, 1582.0, 4066.0, 14710.0, 929119.0, 82800.0, 9246.0, 2912.0, 1231.0, 576.0, 272.0, 174.0, 92.0, 71.0, 44.0, 19.0, 16.0, 16.0, 10.0, 2.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052215576171875, -0.05067253112792969, -0.049129486083984375, -0.04758644104003906, -0.04604339599609375, -0.04450035095214844, -0.042957305908203125, -0.04141426086425781, -0.0398712158203125, -0.03832817077636719, -0.036785125732421875, -0.03524208068847656, -0.03369903564453125, -0.03215599060058594, -0.030612945556640625, -0.029069900512695312, -0.02752685546875, -0.025983810424804688, -0.024440765380859375, -0.022897720336914062, -0.02135467529296875, -0.019811630249023438, -0.018268585205078125, -0.016725540161132812, -0.0151824951171875, -0.013639450073242188, -0.012096405029296875, -0.010553359985351562, -0.00901031494140625, -0.0074672698974609375, -0.005924224853515625, -0.0043811798095703125, -0.002838134765625, -0.0012950897216796875, 0.000247955322265625, 0.0017910003662109375, 0.00333404541015625, 0.0048770904541015625, 0.006420135498046875, 0.007963180541992188, 0.0095062255859375, 0.011049270629882812, 0.012592315673828125, 0.014135360717773438, 0.01567840576171875, 0.017221450805664062, 0.018764495849609375, 0.020307540893554688, 0.0218505859375, 0.023393630981445312, 0.024936676025390625, 0.026479721069335938, 0.02802276611328125, 0.029565811157226562, 0.031108856201171875, 0.03265190124511719, 0.0341949462890625, 0.03573799133300781, 0.037281036376953125, 0.03882408142089844, 0.04036712646484375, 0.04191017150878906, 0.043453216552734375, 0.04499626159667969, 0.046539306640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 3.0, 5.0, 8.0, 12.0, 7.0, 13.0, 46.0, 270.0, 379.0, 162.0, 35.0, 21.0, 5.0, 9.0, 5.0, 3.0, 8.0, 4.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.655122756958008e-05, -4.533771425485611e-05, -4.412420094013214e-05, -4.291068762540817e-05, -4.1697174310684204e-05, -4.0483660995960236e-05, -3.927014768123627e-05, -3.80566343665123e-05, -3.684312105178833e-05, -3.562960773706436e-05, -3.441609442234039e-05, -3.3202581107616425e-05, -3.1989067792892456e-05, -3.077555447816849e-05, -2.956204116344452e-05, -2.834852784872055e-05, -2.7135014533996582e-05, -2.5921501219272614e-05, -2.4707987904548645e-05, -2.3494474589824677e-05, -2.2280961275100708e-05, -2.106744796037674e-05, -1.985393464565277e-05, -1.8640421330928802e-05, -1.7426908016204834e-05, -1.6213394701480865e-05, -1.4999881386756897e-05, -1.3786368072032928e-05, -1.257285475730896e-05, -1.1359341442584991e-05, -1.0145828127861023e-05, -8.932314813137054e-06, -7.718801498413086e-06, -6.5052881836891174e-06, -5.291774868965149e-06, -4.07826155424118e-06, -2.864748239517212e-06, -1.6512349247932434e-06, -4.377216100692749e-07, 7.757917046546936e-07, 1.989305019378662e-06, 3.2028183341026306e-06, 4.416331648826599e-06, 5.629844963550568e-06, 6.843358278274536e-06, 8.056871592998505e-06, 9.270384907722473e-06, 1.0483898222446442e-05, 1.169741153717041e-05, 1.2910924851894379e-05, 1.4124438166618347e-05, 1.5337951481342316e-05, 1.6551464796066284e-05, 1.7764978110790253e-05, 1.897849142551422e-05, 2.019200474023819e-05, 2.1405518054962158e-05, 2.2619031369686127e-05, 2.3832544684410095e-05, 2.5046057999134064e-05, 2.6259571313858032e-05, 2.7473084628582e-05, 2.868659794330597e-05, 2.9900111258029938e-05, 3.1113624572753906e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 3.0, 3.0, 8.0, 8.0, 10.0, 12.0, 14.0, 30.0, 56.0, 60.0, 141.0, 229.0, 525.0, 1327.0, 4344.0, 38908.0, 980525.0, 17437.0, 2953.0, 987.0, 416.0, 214.0, 112.0, 85.0, 43.0, 32.0, 16.0, 15.0, 9.0, 9.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.059844970703125, -0.05810356140136719, -0.056362152099609375, -0.05462074279785156, -0.05287933349609375, -0.05113792419433594, -0.049396514892578125, -0.04765510559082031, -0.0459136962890625, -0.04417228698730469, -0.042430877685546875, -0.04068946838378906, -0.03894805908203125, -0.03720664978027344, -0.035465240478515625, -0.03372383117675781, -0.031982421875, -0.030241012573242188, -0.028499603271484375, -0.026758193969726562, -0.02501678466796875, -0.023275375366210938, -0.021533966064453125, -0.019792556762695312, -0.0180511474609375, -0.016309738159179688, -0.014568328857421875, -0.012826919555664062, -0.01108551025390625, -0.009344100952148438, -0.007602691650390625, -0.0058612823486328125, -0.004119873046875, -0.0023784637451171875, -0.000637054443359375, 0.0011043548583984375, 0.00284576416015625, 0.0045871734619140625, 0.006328582763671875, 0.008069992065429688, 0.0098114013671875, 0.011552810668945312, 0.013294219970703125, 0.015035629272460938, 0.01677703857421875, 0.018518447875976562, 0.020259857177734375, 0.022001266479492188, 0.02374267578125, 0.025484085083007812, 0.027225494384765625, 0.028966903686523438, 0.03070831298828125, 0.03244972229003906, 0.034191131591796875, 0.03593254089355469, 0.0376739501953125, 0.03941535949707031, 0.041156768798828125, 0.04289817810058594, 0.04463958740234375, 0.04638099670410156, 0.048122406005859375, 0.04986381530761719, 0.051605224609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 11.0, 6.0, 25.0, 36.0, 55.0, 104.0, 210.0, 209.0, 136.0, 65.0, 51.0, 23.0, 12.0, 12.0, 9.0, 7.0, 6.0, 0.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03668212890625, -0.035666704177856445, -0.03465127944946289, -0.033635854721069336, -0.03262042999267578, -0.03160500526428223, -0.030589580535888672, -0.029574155807495117, -0.028558731079101562, -0.027543306350708008, -0.026527881622314453, -0.0255124568939209, -0.024497032165527344, -0.02348160743713379, -0.022466182708740234, -0.02145075798034668, -0.020435333251953125, -0.01941990852355957, -0.018404483795166016, -0.01738905906677246, -0.016373634338378906, -0.015358209609985352, -0.014342784881591797, -0.013327360153198242, -0.012311935424804688, -0.011296510696411133, -0.010281085968017578, -0.009265661239624023, -0.008250236511230469, -0.007234811782836914, -0.006219387054443359, -0.005203962326049805, -0.00418853759765625, -0.0031731128692626953, -0.0021576881408691406, -0.001142263412475586, -0.00012683868408203125, 0.0008885860443115234, 0.0019040107727050781, 0.002919435501098633, 0.0039348602294921875, 0.004950284957885742, 0.005965709686279297, 0.0069811344146728516, 0.007996559143066406, 0.009011983871459961, 0.010027408599853516, 0.01104283332824707, 0.012058258056640625, 0.01307368278503418, 0.014089107513427734, 0.015104532241821289, 0.016119956970214844, 0.0171353816986084, 0.018150806427001953, 0.019166231155395508, 0.020181655883789062, 0.021197080612182617, 0.022212505340576172, 0.023227930068969727, 0.02424335479736328, 0.025258779525756836, 0.02627420425415039, 0.027289628982543945, 0.0283050537109375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 7.0, 10.0, 9.0, 17.0, 34.0, 50.0, 93.0, 134.0, 284.0, 138.0, 60.0, 33.0, 30.0, 21.0, 12.0, 15.0, 6.0, 3.0, 9.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9477934837341309, -1.8714975118637085, -1.7952015399932861, -1.7189056873321533, -1.642609715461731, -1.5663137435913086, -1.4900178909301758, -1.4137219190597534, -1.337425947189331, -1.2611299753189087, -1.1848340034484863, -1.1085381507873535, -1.0322421789169312, -0.9559462070465088, -0.8796502947807312, -0.8033543825149536, -0.7270584106445312, -0.6507624387741089, -0.5744665265083313, -0.4981705844402313, -0.42187464237213135, -0.34557870030403137, -0.2692827582359314, -0.1929868459701538, -0.11669087409973145, -0.04039493203163147, 0.035901010036468506, 0.11219695210456848, 0.18849289417266846, 0.26478883624076843, 0.3410847783088684, 0.417380690574646, 0.49367666244506836, 0.5699726343154907, 0.6462685465812683, 0.7225644588470459, 0.7988604307174683, 0.8751564025878906, 0.9514523148536682, 1.0277482271194458, 1.1040441989898682, 1.1803401708602905, 1.256636142730713, 1.3329319953918457, 1.409227967262268, 1.4855239391326904, 1.5618197917938232, 1.6381157636642456, 1.714411735534668, 1.7907077074050903, 1.8670036792755127, 1.9432995319366455, 2.0195956230163574, 2.0958914756774902, 2.172187328338623, 2.248483180999756, 2.3247792720794678, 2.4010751247406006, 2.4773712158203125, 2.5536670684814453, 2.629962921142578, 2.70625901222229, 2.782554864883423, 2.8588509559631348, 2.9351468086242676]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 2.0, 4.0, 5.0, 11.0, 3.0, 11.0, 22.0, 34.0, 19.0, 36.0, 50.0, 39.0, 68.0, 71.0, 61.0, 81.0, 76.0, 73.0, 61.0, 47.0, 48.0, 29.0, 34.0, 28.0, 16.0, 15.0, 9.0, 10.0, 11.0, 9.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9447269439697266, -1.8745737075805664, -1.8044204711914062, -1.734267234802246, -1.664113998413086, -1.5939607620239258, -1.5238075256347656, -1.4536542892456055, -1.3835010528564453, -1.3133478164672852, -1.243194580078125, -1.1730413436889648, -1.1028881072998047, -1.0327348709106445, -0.9625815749168396, -0.8924283385276794, -0.8222750425338745, -0.7521218061447144, -0.6819685697555542, -0.611815333366394, -0.5416620969772339, -0.47150883078575134, -0.4013555645942688, -0.33120232820510864, -0.2610490918159485, -0.19089585542678833, -0.12074260413646698, -0.05058935284614563, 0.019563883543014526, 0.08971711993217468, 0.15987038612365723, 0.23002362251281738, 0.30017685890197754, 0.3703300952911377, 0.44048333168029785, 0.510636568069458, 0.5807898044586182, 0.6509430408477783, 0.7210963368415833, 0.7912495732307434, 0.8614028096199036, 0.9315560460090637, 1.0017093420028687, 1.0718625783920288, 1.142015814781189, 1.2121690511703491, 1.2823222875595093, 1.3524755239486694, 1.4226287603378296, 1.4927819967269897, 1.56293523311615, 1.63308846950531, 1.7032417058944702, 1.7733949422836304, 1.84354829788208, 1.9137015342712402, 1.9838547706604004, 2.0540080070495605, 2.1241612434387207, 2.194314479827881, 2.264467716217041, 2.334620952606201, 2.4047741889953613, 2.4749274253845215, 2.5450806617736816]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 10.0, 8.0, 18.0, 19.0, 15.0, 43.0, 100.0, 211.0, 570.0, 4191238.0, 1421.0, 229.0, 129.0, 64.0, 53.0, 29.0, 25.0, 19.0, 12.0, 14.0, 5.0, 4.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.38671875, -5.21722412109375, -5.0477294921875, -4.87823486328125, -4.708740234375, -4.53924560546875, -4.3697509765625, -4.20025634765625, -4.03076171875, -3.86126708984375, -3.6917724609375, -3.52227783203125, -3.352783203125, -3.18328857421875, -3.0137939453125, -2.84429931640625, -2.6748046875, -2.50531005859375, -2.3358154296875, -2.16632080078125, -1.996826171875, -1.82733154296875, -1.6578369140625, -1.48834228515625, -1.31884765625, -1.14935302734375, -0.9798583984375, -0.81036376953125, -0.640869140625, -0.47137451171875, -0.3018798828125, -0.13238525390625, 0.037109375, 0.20660400390625, 0.3760986328125, 0.54559326171875, 0.715087890625, 0.88458251953125, 1.0540771484375, 1.22357177734375, 1.39306640625, 1.56256103515625, 1.7320556640625, 1.90155029296875, 2.071044921875, 2.24053955078125, 2.4100341796875, 2.57952880859375, 2.7490234375, 2.91851806640625, 3.0880126953125, 3.25750732421875, 3.427001953125, 3.59649658203125, 3.7659912109375, 3.93548583984375, 4.10498046875, 4.27447509765625, 4.4439697265625, 4.61346435546875, 4.782958984375, 4.95245361328125, 5.1219482421875, 5.29144287109375, 5.4609375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 7.0, 11.0, 9.0, 8.0, 22.0, 56.0, 116.0, 177.0, 214.0, 163.0, 78.0, 26.0, 11.0, 9.0, 6.0, 8.0, 4.0, 11.0, 10.0, 3.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.161865234375, -0.15675926208496094, -0.15165328979492188, -0.1465473175048828, -0.14144134521484375, -0.1363353729248047, -0.13122940063476562, -0.12612342834472656, -0.1210174560546875, -0.11591148376464844, -0.11080551147460938, -0.10569953918457031, -0.10059356689453125, -0.09548759460449219, -0.09038162231445312, -0.08527565002441406, -0.080169677734375, -0.07506370544433594, -0.06995773315429688, -0.06485176086425781, -0.05974578857421875, -0.05463981628417969, -0.049533843994140625, -0.04442787170410156, -0.0393218994140625, -0.03421592712402344, -0.029109954833984375, -0.024003982543945312, -0.01889801025390625, -0.013792037963867188, -0.008686065673828125, -0.0035800933837890625, 0.00152587890625, 0.0066318511962890625, 0.011737823486328125, 0.016843795776367188, 0.02194976806640625, 0.027055740356445312, 0.032161712646484375, 0.03726768493652344, 0.0423736572265625, 0.04747962951660156, 0.052585601806640625, 0.05769157409667969, 0.06279754638671875, 0.06790351867675781, 0.07300949096679688, 0.07811546325683594, 0.083221435546875, 0.08832740783691406, 0.09343338012695312, 0.09853935241699219, 0.10364532470703125, 0.10875129699707031, 0.11385726928710938, 0.11896324157714844, 0.1240692138671875, 0.12917518615722656, 0.13428115844726562, 0.1393871307373047, 0.14449310302734375, 0.1495990753173828, 0.15470504760742188, 0.15981101989746094, 0.1649169921875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 8.0, 4.0, 8.0, 8.0, 22.0, 21.0, 25.0, 39.0, 54.0, 63.0, 75.0, 114.0, 159.0, 266.0, 386.0, 717.0, 1387.0, 3752.0, 15056.0, 751966.0, 3394800.0, 17248.0, 4381.0, 1689.0, 784.0, 434.0, 262.0, 187.0, 118.0, 70.0, 55.0, 38.0, 29.0, 16.0, 13.0, 9.0, 4.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.290283203125, -0.2819995880126953, -0.2737159729003906, -0.26543235778808594, -0.25714874267578125, -0.24886512756347656, -0.24058151245117188, -0.2322978973388672, -0.2240142822265625, -0.2157306671142578, -0.20744705200195312, -0.19916343688964844, -0.19087982177734375, -0.18259620666503906, -0.17431259155273438, -0.1660289764404297, -0.157745361328125, -0.1494617462158203, -0.14117813110351562, -0.13289451599121094, -0.12461090087890625, -0.11632728576660156, -0.10804367065429688, -0.09976005554199219, -0.0914764404296875, -0.08319282531738281, -0.07490921020507812, -0.06662559509277344, -0.05834197998046875, -0.05005836486816406, -0.041774749755859375, -0.03349113464355469, -0.02520751953125, -0.016923904418945312, -0.008640289306640625, -0.0003566741943359375, 0.00792694091796875, 0.016210556030273438, 0.024494171142578125, 0.03277778625488281, 0.0410614013671875, 0.04934501647949219, 0.057628631591796875, 0.06591224670410156, 0.07419586181640625, 0.08247947692871094, 0.09076309204101562, 0.09904670715332031, 0.107330322265625, 0.11561393737792969, 0.12389755249023438, 0.13218116760253906, 0.14046478271484375, 0.14874839782714844, 0.15703201293945312, 0.1653156280517578, 0.1735992431640625, 0.1818828582763672, 0.19016647338867188, 0.19845008850097656, 0.20673370361328125, 0.21501731872558594, 0.22330093383789062, 0.2315845489501953, 0.2398681640625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 7.0, 14.0, 22.0, 40.0, 178.0, 2390.0, 1229.0, 106.0, 34.0, 15.0, 8.0, 10.0, 4.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37255859375, -0.3621864318847656, -0.35181427001953125, -0.3414421081542969, -0.3310699462890625, -0.3206977844238281, -0.31032562255859375, -0.2999534606933594, -0.289581298828125, -0.2792091369628906, -0.26883697509765625, -0.2584648132324219, -0.2480926513671875, -0.23772048950195312, -0.22734832763671875, -0.21697616577148438, -0.20660400390625, -0.19623184204101562, -0.18585968017578125, -0.17548751831054688, -0.1651153564453125, -0.15474319458007812, -0.14437103271484375, -0.13399887084960938, -0.123626708984375, -0.11325454711914062, -0.10288238525390625, -0.09251022338867188, -0.0821380615234375, -0.07176589965820312, -0.06139373779296875, -0.051021575927734375, -0.0406494140625, -0.030277252197265625, -0.01990509033203125, -0.009532928466796875, 0.0008392333984375, 0.011211395263671875, 0.02158355712890625, 0.031955718994140625, 0.042327880859375, 0.052700042724609375, 0.06307220458984375, 0.07344436645507812, 0.0838165283203125, 0.09418869018554688, 0.10456085205078125, 0.11493301391601562, 0.12530517578125, 0.13567733764648438, 0.14604949951171875, 0.15642166137695312, 0.1667938232421875, 0.17716598510742188, 0.18753814697265625, 0.19791030883789062, 0.208282470703125, 0.21865463256835938, 0.22902679443359375, 0.23939895629882812, 0.2497711181640625, 0.2601432800292969, 0.27051544189453125, 0.2808876037597656, 0.291259765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 5.0, 1.0, 2.0, 1.0, 3.0, 10.0, 3.0, 8.0, 7.0, 12.0, 19.0, 17.0, 23.0, 34.0, 35.0, 73.0, 73.0, 138.0, 271.0, 149.0, 64.0, 27.0, 12.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.121859073638916, -1.090567946434021, -1.0592769384384155, -1.0279858112335205, -0.996694803237915, -0.96540367603302, -0.9341126084327698, -0.9028215408325195, -0.8715304732322693, -0.840239405632019, -0.8089483380317688, -0.7776572704315186, -0.7463661432266235, -0.7150751352310181, -0.683784008026123, -0.6524929404258728, -0.6212018728256226, -0.5899108052253723, -0.5586197376251221, -0.5273286700248718, -0.4960375726222992, -0.46474650502204895, -0.4334554076194763, -0.4021643400192261, -0.37087327241897583, -0.3395822048187256, -0.30829113721847534, -0.2770000398159027, -0.24570897221565247, -0.21441790461540222, -0.18312682211399078, -0.15183573961257935, -0.12054455280303955, -0.08925347775220871, -0.05796240270137787, -0.026671327650547028, 0.0046197474002838135, 0.03591081500053406, 0.0672018975019455, 0.09849298000335693, 0.12978404760360718, 0.16107511520385742, 0.19236619770526886, 0.2236572802066803, 0.25494834780693054, 0.2862394154071808, 0.3175305128097534, 0.34882158041000366, 0.3801126480102539, 0.41140371561050415, 0.4426947832107544, 0.473985880613327, 0.5052769184112549, 0.5365680456161499, 0.5678591132164001, 0.5991501808166504, 0.6304412484169006, 0.6617323160171509, 0.6930233836174011, 0.7243144512176514, 0.7556055784225464, 0.7868965864181519, 0.8181877136230469, 0.8494787812232971, 0.8807698488235474]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 6.0, 5.0, 8.0, 12.0, 7.0, 15.0, 26.0, 18.0, 24.0, 32.0, 27.0, 40.0, 37.0, 50.0, 46.0, 43.0, 60.0, 43.0, 43.0, 51.0, 37.0, 51.0, 43.0, 32.0, 36.0, 36.0, 30.0, 19.0, 15.0, 20.0, 23.0, 14.0, 10.0, 8.0, 8.0, 8.0, 5.0, 2.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6329599618911743, -0.6111306548118591, -0.5893012881278992, -0.567471981048584, -0.5456426739692688, -0.5238133072853088, -0.5019840002059937, -0.4801546633243561, -0.4583253264427185, -0.43649598956108093, -0.41466668248176575, -0.3928373456001282, -0.3710080087184906, -0.349178671836853, -0.32734936475753784, -0.30552002787590027, -0.2836907207965851, -0.2618613839149475, -0.24003206193447113, -0.21820273995399475, -0.19637340307235718, -0.1745440810918808, -0.15271475911140442, -0.13088542222976685, -0.10905610024929047, -0.08722677081823349, -0.06539744138717651, -0.043568119406700134, -0.021738789975643158, 9.053945541381836e-05, 0.021919861435890198, 0.04374919831752777, 0.06557852029800415, 0.08740784972906113, 0.1092371791601181, 0.13106650114059448, 0.15289583802223206, 0.17472516000270844, 0.19655448198318481, 0.2183838188648224, 0.24021314084529877, 0.26204246282577515, 0.2838717997074127, 0.3057011365890503, 0.3275304436683655, 0.34935978055000305, 0.3711891174316406, 0.3930184245109558, 0.4148477613925934, 0.43667709827423096, 0.45850640535354614, 0.4803357422351837, 0.5021650791168213, 0.5239943861961365, 0.5458236932754517, 0.5676530599594116, 0.5894823670387268, 0.611311674118042, 0.633141040802002, 0.6549703478813171, 0.6767996549606323, 0.6986290216445923, 0.7204583287239075, 0.7422876358032227, 0.7641170024871826]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0, 5.0, 7.0, 13.0, 9.0, 14.0, 16.0, 12.0, 36.0, 48.0, 71.0, 93.0, 118.0, 178.0, 248.0, 351.0, 498.0, 621.0, 886.0, 1164.0, 1804.0, 2778.0, 4770.0, 8604.0, 20656.0, 101173.0, 783270.0, 81444.0, 18790.0, 7874.0, 4407.0, 2715.0, 1647.0, 1179.0, 803.0, 589.0, 387.0, 320.0, 245.0, 187.0, 117.0, 89.0, 80.0, 58.0, 47.0, 29.0, 31.0, 22.0, 16.0, 12.0, 10.0, 4.0, 3.0, 6.0, 3.0, 1.0, 4.0], "bins": [-0.287353515625, -0.2787628173828125, -0.270172119140625, -0.2615814208984375, -0.25299072265625, -0.2444000244140625, -0.235809326171875, -0.2272186279296875, -0.2186279296875, -0.2100372314453125, -0.201446533203125, -0.1928558349609375, -0.18426513671875, -0.1756744384765625, -0.167083740234375, -0.1584930419921875, -0.14990234375, -0.1413116455078125, -0.132720947265625, -0.1241302490234375, -0.11553955078125, -0.1069488525390625, -0.098358154296875, -0.0897674560546875, -0.0811767578125, -0.0725860595703125, -0.063995361328125, -0.0554046630859375, -0.04681396484375, -0.0382232666015625, -0.029632568359375, -0.0210418701171875, -0.012451171875, -0.0038604736328125, 0.004730224609375, 0.0133209228515625, 0.02191162109375, 0.0305023193359375, 0.039093017578125, 0.0476837158203125, 0.0562744140625, 0.0648651123046875, 0.073455810546875, 0.0820465087890625, 0.09063720703125, 0.0992279052734375, 0.107818603515625, 0.1164093017578125, 0.125, 0.1335906982421875, 0.142181396484375, 0.1507720947265625, 0.15936279296875, 0.1679534912109375, 0.176544189453125, 0.1851348876953125, 0.1937255859375, 0.2023162841796875, 0.210906982421875, 0.2194976806640625, 0.22808837890625, 0.2366790771484375, 0.245269775390625, 0.2538604736328125, 0.262451171875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 10.0, 9.0, 7.0, 20.0, 43.0, 67.0, 131.0, 167.0, 167.0, 129.0, 99.0, 35.0, 15.0, 9.0, 4.0, 6.0, 11.0, 8.0, 10.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.164794921875, -0.1598796844482422, -0.15496444702148438, -0.15004920959472656, -0.14513397216796875, -0.14021873474121094, -0.13530349731445312, -0.1303882598876953, -0.1254730224609375, -0.12055778503417969, -0.11564254760742188, -0.11072731018066406, -0.10581207275390625, -0.10089683532714844, -0.09598159790039062, -0.09106636047363281, -0.086151123046875, -0.08123588562011719, -0.07632064819335938, -0.07140541076660156, -0.06649017333984375, -0.06157493591308594, -0.056659698486328125, -0.05174446105957031, -0.0468292236328125, -0.04191398620605469, -0.036998748779296875, -0.03208351135253906, -0.02716827392578125, -0.022253036499023438, -0.017337799072265625, -0.012422561645507812, -0.00750732421875, -0.0025920867919921875, 0.002323150634765625, 0.0072383880615234375, 0.01215362548828125, 0.017068862915039062, 0.021984100341796875, 0.026899337768554688, 0.0318145751953125, 0.03672981262207031, 0.041645050048828125, 0.04656028747558594, 0.05147552490234375, 0.05639076232910156, 0.061305999755859375, 0.06622123718261719, 0.071136474609375, 0.07605171203613281, 0.08096694946289062, 0.08588218688964844, 0.09079742431640625, 0.09571266174316406, 0.10062789916992188, 0.10554313659667969, 0.1104583740234375, 0.11537361145019531, 0.12028884887695312, 0.12520408630371094, 0.13011932373046875, 0.13503456115722656, 0.13994979858398438, 0.1448650360107422, 0.1497802734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 11.0, 7.0, 8.0, 17.0, 24.0, 20.0, 40.0, 47.0, 72.0, 81.0, 121.0, 185.0, 298.0, 504.0, 954.0, 2611.0, 12376.0, 141467.0, 840443.0, 40234.0, 5757.0, 1520.0, 641.0, 355.0, 221.0, 144.0, 99.0, 75.0, 57.0, 44.0, 30.0, 24.0, 17.0, 19.0, 10.0, 6.0, 3.0, 7.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4775390625, -0.4612274169921875, -0.444915771484375, -0.4286041259765625, -0.41229248046875, -0.3959808349609375, -0.379669189453125, -0.3633575439453125, -0.3470458984375, -0.3307342529296875, -0.314422607421875, -0.2981109619140625, -0.28179931640625, -0.2654876708984375, -0.249176025390625, -0.2328643798828125, -0.216552734375, -0.2002410888671875, -0.183929443359375, -0.1676177978515625, -0.15130615234375, -0.1349945068359375, -0.118682861328125, -0.1023712158203125, -0.0860595703125, -0.0697479248046875, -0.053436279296875, -0.0371246337890625, -0.02081298828125, -0.0045013427734375, 0.011810302734375, 0.0281219482421875, 0.04443359375, 0.0607452392578125, 0.077056884765625, 0.0933685302734375, 0.10968017578125, 0.1259918212890625, 0.142303466796875, 0.1586151123046875, 0.1749267578125, 0.1912384033203125, 0.207550048828125, 0.2238616943359375, 0.24017333984375, 0.2564849853515625, 0.272796630859375, 0.2891082763671875, 0.305419921875, 0.3217315673828125, 0.338043212890625, 0.3543548583984375, 0.37066650390625, 0.3869781494140625, 0.403289794921875, 0.4196014404296875, 0.4359130859375, 0.4522247314453125, 0.468536376953125, 0.4848480224609375, 0.50115966796875, 0.5174713134765625, 0.533782958984375, 0.5500946044921875, 0.56640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 6.0, 9.0, 17.0, 16.0, 16.0, 23.0, 19.0, 30.0, 43.0, 48.0, 47.0, 55.0, 43.0, 44.0, 50.0, 50.0, 57.0, 50.0, 50.0, 44.0, 46.0, 37.0, 38.0, 24.0, 22.0, 24.0, 24.0, 8.0, 15.0, 12.0, 9.0, 1.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43212890625, -0.4173126220703125, -0.402496337890625, -0.3876800537109375, -0.37286376953125, -0.3580474853515625, -0.343231201171875, -0.3284149169921875, -0.3135986328125, -0.2987823486328125, -0.283966064453125, -0.2691497802734375, -0.25433349609375, -0.2395172119140625, -0.224700927734375, -0.2098846435546875, -0.195068359375, -0.1802520751953125, -0.165435791015625, -0.1506195068359375, -0.13580322265625, -0.1209869384765625, -0.106170654296875, -0.0913543701171875, -0.0765380859375, -0.0617218017578125, -0.046905517578125, -0.0320892333984375, -0.01727294921875, -0.0024566650390625, 0.012359619140625, 0.0271759033203125, 0.0419921875, 0.0568084716796875, 0.071624755859375, 0.0864410400390625, 0.10125732421875, 0.1160736083984375, 0.130889892578125, 0.1457061767578125, 0.1605224609375, 0.1753387451171875, 0.190155029296875, 0.2049713134765625, 0.21978759765625, 0.2346038818359375, 0.249420166015625, 0.2642364501953125, 0.279052734375, 0.2938690185546875, 0.308685302734375, 0.3235015869140625, 0.33831787109375, 0.3531341552734375, 0.367950439453125, 0.3827667236328125, 0.3975830078125, 0.4123992919921875, 0.427215576171875, 0.4420318603515625, 0.45684814453125, 0.4716644287109375, 0.486480712890625, 0.5012969970703125, 0.51611328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 1.0, 2.0, 6.0, 6.0, 4.0, 8.0, 14.0, 27.0, 26.0, 65.0, 85.0, 141.0, 275.0, 593.0, 1811.0, 9375.0, 795425.0, 231662.0, 6531.0, 1365.0, 497.0, 249.0, 116.0, 76.0, 58.0, 35.0, 27.0, 16.0, 12.0, 9.0, 8.0, 4.0, 6.0, 6.0, 7.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0], "bins": [-0.08758544921875, -0.08539152145385742, -0.08319759368896484, -0.08100366592407227, -0.07880973815917969, -0.07661581039428711, -0.07442188262939453, -0.07222795486450195, -0.07003402709960938, -0.0678400993347168, -0.06564617156982422, -0.06345224380493164, -0.06125831604003906, -0.059064388275146484, -0.056870460510253906, -0.05467653274536133, -0.05248260498046875, -0.05028867721557617, -0.048094749450683594, -0.045900821685791016, -0.04370689392089844, -0.04151296615600586, -0.03931903839111328, -0.0371251106262207, -0.034931182861328125, -0.03273725509643555, -0.03054332733154297, -0.02834939956665039, -0.026155471801757812, -0.023961544036865234, -0.021767616271972656, -0.019573688507080078, -0.0173797607421875, -0.015185832977294922, -0.012991905212402344, -0.010797977447509766, -0.008604049682617188, -0.006410121917724609, -0.004216194152832031, -0.002022266387939453, 0.000171661376953125, 0.002365589141845703, 0.004559516906738281, 0.006753444671630859, 0.008947372436523438, 0.011141300201416016, 0.013335227966308594, 0.015529155731201172, 0.01772308349609375, 0.019917011260986328, 0.022110939025878906, 0.024304866790771484, 0.026498794555664062, 0.02869272232055664, 0.03088665008544922, 0.0330805778503418, 0.035274505615234375, 0.03746843338012695, 0.03966236114501953, 0.04185628890991211, 0.04405021667480469, 0.046244144439697266, 0.048438072204589844, 0.05063199996948242, 0.052825927734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 10.0, 4.0, 14.0, 11.0, 13.0, 15.0, 22.0, 26.0, 32.0, 45.0, 46.0, 47.0, 43.0, 48.0, 77.0, 64.0, 66.0, 60.0, 61.0, 42.0, 48.0, 45.0, 28.0, 20.0, 17.0, 14.0, 11.0, 19.0, 8.0, 5.0, 10.0, 6.0, 5.0, 2.0, 7.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.927417755126953e-06, -7.692724466323853e-06, -7.458031177520752e-06, -7.223337888717651e-06, -6.988644599914551e-06, -6.75395131111145e-06, -6.51925802230835e-06, -6.284564733505249e-06, -6.0498714447021484e-06, -5.815178155899048e-06, -5.580484867095947e-06, -5.345791578292847e-06, -5.111098289489746e-06, -4.8764050006866455e-06, -4.641711711883545e-06, -4.407018423080444e-06, -4.172325134277344e-06, -3.937631845474243e-06, -3.7029385566711426e-06, -3.468245267868042e-06, -3.2335519790649414e-06, -2.998858690261841e-06, -2.7641654014587402e-06, -2.5294721126556396e-06, -2.294778823852539e-06, -2.0600855350494385e-06, -1.8253922462463379e-06, -1.5906989574432373e-06, -1.3560056686401367e-06, -1.1213123798370361e-06, -8.866190910339355e-07, -6.51925802230835e-07, -4.172325134277344e-07, -1.825392246246338e-07, 5.21540641784668e-08, 2.868473529815674e-07, 5.21540641784668e-07, 7.562339305877686e-07, 9.909272193908691e-07, 1.2256205081939697e-06, 1.4603137969970703e-06, 1.695007085800171e-06, 1.9297003746032715e-06, 2.164393663406372e-06, 2.3990869522094727e-06, 2.6337802410125732e-06, 2.868473529815674e-06, 3.1031668186187744e-06, 3.337860107421875e-06, 3.5725533962249756e-06, 3.807246685028076e-06, 4.041939973831177e-06, 4.276633262634277e-06, 4.511326551437378e-06, 4.7460198402404785e-06, 4.980713129043579e-06, 5.21540641784668e-06, 5.45009970664978e-06, 5.684792995452881e-06, 5.9194862842559814e-06, 6.154179573059082e-06, 6.388872861862183e-06, 6.623566150665283e-06, 6.858259439468384e-06, 7.092952728271484e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 5.0, 3.0, 8.0, 8.0, 11.0, 12.0, 18.0, 18.0, 37.0, 49.0, 57.0, 115.0, 182.0, 331.0, 689.0, 1685.0, 5777.0, 36873.0, 872956.0, 114277.0, 10707.0, 2736.0, 949.0, 431.0, 193.0, 121.0, 82.0, 59.0, 42.0, 25.0, 22.0, 15.0, 18.0, 10.0, 6.0, 7.0, 6.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04278564453125, -0.041391849517822266, -0.03999805450439453, -0.0386042594909668, -0.03721046447753906, -0.03581666946411133, -0.034422874450683594, -0.03302907943725586, -0.031635284423828125, -0.03024148941040039, -0.028847694396972656, -0.027453899383544922, -0.026060104370117188, -0.024666309356689453, -0.02327251434326172, -0.021878719329833984, -0.02048492431640625, -0.019091129302978516, -0.01769733428955078, -0.016303539276123047, -0.014909744262695312, -0.013515949249267578, -0.012122154235839844, -0.01072835922241211, -0.009334564208984375, -0.00794076919555664, -0.006546974182128906, -0.005153179168701172, -0.0037593841552734375, -0.002365589141845703, -0.0009717941284179688, 0.0004220008850097656, 0.0018157958984375, 0.0032095909118652344, 0.004603385925292969, 0.005997180938720703, 0.0073909759521484375, 0.008784770965576172, 0.010178565979003906, 0.01157236099243164, 0.012966156005859375, 0.01435995101928711, 0.015753746032714844, 0.017147541046142578, 0.018541336059570312, 0.019935131072998047, 0.02132892608642578, 0.022722721099853516, 0.02411651611328125, 0.025510311126708984, 0.02690410614013672, 0.028297901153564453, 0.029691696166992188, 0.031085491180419922, 0.032479286193847656, 0.03387308120727539, 0.035266876220703125, 0.03666067123413086, 0.038054466247558594, 0.03944826126098633, 0.04084205627441406, 0.0422358512878418, 0.04362964630126953, 0.045023441314697266, 0.046417236328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 5.0, 4.0, 4.0, 12.0, 12.0, 14.0, 18.0, 25.0, 38.0, 40.0, 51.0, 55.0, 60.0, 86.0, 91.0, 82.0, 71.0, 81.0, 52.0, 49.0, 33.0, 26.0, 20.0, 10.0, 10.0, 10.0, 7.0, 7.0, 4.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041534423828125, -0.040216922760009766, -0.03889942169189453, -0.0375819206237793, -0.03626441955566406, -0.03494691848754883, -0.033629417419433594, -0.03231191635131836, -0.030994415283203125, -0.02967691421508789, -0.028359413146972656, -0.027041912078857422, -0.025724411010742188, -0.024406909942626953, -0.02308940887451172, -0.021771907806396484, -0.02045440673828125, -0.019136905670166016, -0.01781940460205078, -0.016501903533935547, -0.015184402465820312, -0.013866901397705078, -0.012549400329589844, -0.01123189926147461, -0.009914398193359375, -0.00859689712524414, -0.007279396057128906, -0.005961894989013672, -0.0046443939208984375, -0.003326892852783203, -0.0020093917846679688, -0.0006918907165527344, 0.0006256103515625, 0.0019431114196777344, 0.0032606124877929688, 0.004578113555908203, 0.0058956146240234375, 0.007213115692138672, 0.008530616760253906, 0.00984811782836914, 0.011165618896484375, 0.01248311996459961, 0.013800621032714844, 0.015118122100830078, 0.016435623168945312, 0.017753124237060547, 0.01907062530517578, 0.020388126373291016, 0.02170562744140625, 0.023023128509521484, 0.02434062957763672, 0.025658130645751953, 0.026975631713867188, 0.028293132781982422, 0.029610633850097656, 0.03092813491821289, 0.032245635986328125, 0.03356313705444336, 0.034880638122558594, 0.03619813919067383, 0.03751564025878906, 0.0388331413269043, 0.04015064239501953, 0.041468143463134766, 0.04278564453125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 8.0, 14.0, 37.0, 164.0, 588.0, 134.0, 41.0, 14.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.919511795043945, -7.771296501159668, -7.623081207275391, -7.474865436553955, -7.326650142669678, -7.1784348487854, -7.030219078063965, -6.8820037841796875, -6.73378849029541, -6.585573196411133, -6.4373579025268555, -6.28914213180542, -6.140926837921143, -5.992711544036865, -5.84449577331543, -5.696280479431152, -5.548065185546875, -5.399849891662598, -5.25163459777832, -5.103418827056885, -4.955203533172607, -4.80698823928833, -4.6587724685668945, -4.510557174682617, -4.36234188079834, -4.2141265869140625, -4.065911293029785, -3.9176955223083496, -3.7694802284240723, -3.621264934539795, -3.4730494022369385, -3.324833869934082, -3.1766185760498047, -3.0284032821655273, -2.880187749862671, -2.7319722175598145, -2.583756923675537, -2.4355416297912598, -2.2873260974884033, -2.139110565185547, -1.9908952713012695, -1.8426798582077026, -1.6944644451141357, -1.5462490320205688, -1.398033618927002, -1.249818205833435, -1.1016027927398682, -0.9533873796463013, -0.8051719665527344, -0.6569565534591675, -0.5087411403656006, -0.3605257272720337, -0.2123103141784668, -0.0640949010848999, 0.08412051200866699, 0.2323359251022339, 0.3805513381958008, 0.5287667512893677, 0.6769821643829346, 0.8251975774765015, 0.9734129905700684, 1.1216284036636353, 1.2698438167572021, 1.418059229850769, 1.566274642944336]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 10.0, 7.0, 9.0, 12.0, 15.0, 13.0, 21.0, 12.0, 19.0, 31.0, 16.0, 32.0, 30.0, 42.0, 48.0, 41.0, 60.0, 72.0, 61.0, 62.0, 44.0, 48.0, 28.0, 42.0, 32.0, 21.0, 24.0, 16.0, 23.0, 11.0, 13.0, 13.0, 13.0, 11.0, 3.0, 10.0, 5.0, 9.0, 8.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.577056884765625, -1.526253342628479, -1.475449800491333, -1.4246461391448975, -1.3738425970077515, -1.3230390548706055, -1.2722355127334595, -1.2214319705963135, -1.170628309249878, -1.119824767112732, -1.069021224975586, -1.0182175636291504, -0.9674140214920044, -0.9166104793548584, -0.8658069372177124, -0.8150033950805664, -0.7641998529434204, -0.7133963108062744, -0.6625927090644836, -0.6117891669273376, -0.5609855651855469, -0.5101820230484009, -0.4593784809112549, -0.4085749089717865, -0.3577713370323181, -0.30696776509284973, -0.25616419315338135, -0.20536065101623535, -0.15455707907676697, -0.10375350713729858, -0.05294996500015259, -0.002146393060684204, 0.04865729808807373, 0.09946086257696152, 0.1502644270658493, 0.2010679841041565, 0.2518715560436249, 0.30267512798309326, 0.35347867012023926, 0.40428224205970764, 0.455085813999176, 0.505889356136322, 0.5566929578781128, 0.6074965000152588, 0.6583000421524048, 0.7091036438941956, 0.7599071860313416, 0.8107107877731323, 0.8615143299102783, 0.9123178720474243, 0.9631214737892151, 1.0139250755310059, 1.0647286176681519, 1.1155321598052979, 1.1663357019424438, 1.2171392440795898, 1.2679429054260254, 1.3187464475631714, 1.3695499897003174, 1.420353651046753, 1.471157193183899, 1.521960735321045, 1.572764277458191, 1.623567819595337, 1.674371361732483]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 0.0, 4.0, 5.0, 2.0, 5.0, 6.0, 12.0, 10.0, 8.0, 12.0, 9.0, 18.0, 35.0, 47.0, 43.0, 83.0, 135.0, 246.0, 486.0, 4035.0, 53292.0, 4044722.0, 84193.0, 5240.0, 741.0, 275.0, 151.0, 98.0, 81.0, 49.0, 39.0, 32.0, 24.0, 20.0, 21.0, 16.0, 24.0, 12.0, 19.0, 10.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.2467041015625, -0.2393646240234375, -0.232025146484375, -0.2246856689453125, -0.21734619140625, -0.2100067138671875, -0.202667236328125, -0.1953277587890625, -0.18798828125, -0.1806488037109375, -0.173309326171875, -0.1659698486328125, -0.15863037109375, -0.1512908935546875, -0.143951416015625, -0.1366119384765625, -0.1292724609375, -0.1219329833984375, -0.114593505859375, -0.1072540283203125, -0.09991455078125, -0.0925750732421875, -0.085235595703125, -0.0778961181640625, -0.070556640625, -0.0632171630859375, -0.055877685546875, -0.0485382080078125, -0.04119873046875, -0.0338592529296875, -0.026519775390625, -0.0191802978515625, -0.0118408203125, -0.0045013427734375, 0.002838134765625, 0.0101776123046875, 0.01751708984375, 0.0248565673828125, 0.032196044921875, 0.0395355224609375, 0.046875, 0.0542144775390625, 0.061553955078125, 0.0688934326171875, 0.07623291015625, 0.0835723876953125, 0.090911865234375, 0.0982513427734375, 0.1055908203125, 0.1129302978515625, 0.120269775390625, 0.1276092529296875, 0.13494873046875, 0.1422882080078125, 0.149627685546875, 0.1569671630859375, 0.164306640625, 0.1716461181640625, 0.178985595703125, 0.1863250732421875, 0.19366455078125, 0.2010040283203125, 0.208343505859375, 0.2156829833984375, 0.2230224609375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 6.0, 12.0, 12.0, 19.0, 36.0, 47.0, 68.0, 94.0, 125.0, 129.0, 130.0, 85.0, 64.0, 33.0, 29.0, 21.0, 18.0, 6.0, 11.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.162109375, -0.1573162078857422, -0.15252304077148438, -0.14772987365722656, -0.14293670654296875, -0.13814353942871094, -0.13335037231445312, -0.1285572052001953, -0.1237640380859375, -0.11897087097167969, -0.11417770385742188, -0.10938453674316406, -0.10459136962890625, -0.09979820251464844, -0.09500503540039062, -0.09021186828613281, -0.085418701171875, -0.08062553405761719, -0.07583236694335938, -0.07103919982910156, -0.06624603271484375, -0.06145286560058594, -0.056659698486328125, -0.05186653137207031, -0.0470733642578125, -0.04228019714355469, -0.037487030029296875, -0.03269386291503906, -0.02790069580078125, -0.023107528686523438, -0.018314361572265625, -0.013521194458007812, -0.00872802734375, -0.0039348602294921875, 0.000858306884765625, 0.0056514739990234375, 0.01044464111328125, 0.015237808227539062, 0.020030975341796875, 0.024824142456054688, 0.0296173095703125, 0.03441047668457031, 0.039203643798828125, 0.04399681091308594, 0.04878997802734375, 0.05358314514160156, 0.058376312255859375, 0.06316947937011719, 0.067962646484375, 0.07275581359863281, 0.07754898071289062, 0.08234214782714844, 0.08713531494140625, 0.09192848205566406, 0.09672164916992188, 0.10151481628417969, 0.1063079833984375, 0.11110115051269531, 0.11589431762695312, 0.12068748474121094, 0.12548065185546875, 0.13027381896972656, 0.13506698608398438, 0.1398601531982422, 0.1446533203125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 8.0, 27.0, 39.0, 88.0, 133.0, 329.0, 868.0, 2945.0, 16185.0, 4052015.0, 113347.0, 6014.0, 1354.0, 446.0, 216.0, 106.0, 51.0, 44.0, 19.0, 13.0, 11.0, 8.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2232666015625, -0.21550941467285156, -0.20775222778320312, -0.1999950408935547, -0.19223785400390625, -0.1844806671142578, -0.17672348022460938, -0.16896629333496094, -0.1612091064453125, -0.15345191955566406, -0.14569473266601562, -0.1379375457763672, -0.13018035888671875, -0.12242317199707031, -0.11466598510742188, -0.10690879821777344, -0.099151611328125, -0.09139442443847656, -0.08363723754882812, -0.07588005065917969, -0.06812286376953125, -0.06036567687988281, -0.052608489990234375, -0.04485130310058594, -0.0370941162109375, -0.029336929321289062, -0.021579742431640625, -0.013822555541992188, -0.00606536865234375, 0.0016918182373046875, 0.009449005126953125, 0.017206192016601562, 0.02496337890625, 0.03272056579589844, 0.040477752685546875, 0.04823493957519531, 0.05599212646484375, 0.06374931335449219, 0.07150650024414062, 0.07926368713378906, 0.0870208740234375, 0.09477806091308594, 0.10253524780273438, 0.11029243469238281, 0.11804962158203125, 0.1258068084716797, 0.13356399536132812, 0.14132118225097656, 0.149078369140625, 0.15683555603027344, 0.16459274291992188, 0.1723499298095703, 0.18010711669921875, 0.1878643035888672, 0.19562149047851562, 0.20337867736816406, 0.2111358642578125, 0.21889305114746094, 0.22665023803710938, 0.2344074249267578, 0.24216461181640625, 0.2499217987060547, 0.2576789855957031, 0.26543617248535156, 0.273193359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 8.0, 4.0, 13.0, 19.0, 33.0, 120.0, 761.0, 2423.0, 521.0, 87.0, 33.0, 11.0, 12.0, 5.0, 5.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.182861328125, -0.174713134765625, -0.16656494140625, -0.158416748046875, -0.1502685546875, -0.142120361328125, -0.13397216796875, -0.125823974609375, -0.11767578125, -0.109527587890625, -0.10137939453125, -0.093231201171875, -0.0850830078125, -0.076934814453125, -0.06878662109375, -0.060638427734375, -0.052490234375, -0.044342041015625, -0.03619384765625, -0.028045654296875, -0.0198974609375, -0.011749267578125, -0.00360107421875, 0.004547119140625, 0.0126953125, 0.020843505859375, 0.02899169921875, 0.037139892578125, 0.0452880859375, 0.053436279296875, 0.06158447265625, 0.069732666015625, 0.077880859375, 0.086029052734375, 0.09417724609375, 0.102325439453125, 0.1104736328125, 0.118621826171875, 0.12677001953125, 0.134918212890625, 0.14306640625, 0.151214599609375, 0.15936279296875, 0.167510986328125, 0.1756591796875, 0.183807373046875, 0.19195556640625, 0.200103759765625, 0.208251953125, 0.216400146484375, 0.22454833984375, 0.232696533203125, 0.2408447265625, 0.248992919921875, 0.25714111328125, 0.265289306640625, 0.2734375, 0.281585693359375, 0.28973388671875, 0.297882080078125, 0.3060302734375, 0.314178466796875, 0.32232666015625, 0.330474853515625, 0.338623046875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 11.0, 16.0, 24.0, 97.0, 407.0, 348.0, 67.0, 20.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0483574867248535, -1.994523048400879, -1.9406887292861938, -1.8868542909622192, -1.8330199718475342, -1.7791855335235596, -1.725351095199585, -1.6715167760849, -1.6176823377609253, -1.5638478994369507, -1.5100135803222656, -1.456179141998291, -1.402344822883606, -1.3485103845596313, -1.2946760654449463, -1.2408416271209717, -1.187007188796997, -1.1331727504730225, -1.0793384313583374, -1.0255039930343628, -0.971669614315033, -0.9178352355957031, -0.8640008568763733, -0.8101664781570435, -0.7563321590423584, -0.7024977803230286, -0.6486634016036987, -0.5948289632797241, -0.5409945845603943, -0.48716020584106445, -0.4333258271217346, -0.3794914186000824, -0.3256570100784302, -0.27182263135910034, -0.21798822283744812, -0.1641538441181183, -0.11031945049762726, -0.05648505687713623, -0.0026506781578063965, 0.051183730363845825, 0.10501810908317566, 0.1588525027036667, 0.21268689632415771, 0.26652127504348755, 0.3203556537628174, 0.3741900622844696, 0.42802444100379944, 0.48185884952545166, 0.5356932282447815, 0.5895276069641113, 0.6433619856834412, 0.697196364402771, 0.7510308027267456, 0.8048651814460754, 0.8586995601654053, 0.9125339984893799, 0.9663683176040649, 1.0202027559280396, 1.0740370750427246, 1.1278715133666992, 1.1817058324813843, 1.2355402708053589, 1.289374589920044, 1.3432090282440186, 1.3970434665679932]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 8.0, 11.0, 18.0, 25.0, 27.0, 45.0, 50.0, 60.0, 63.0, 67.0, 74.0, 87.0, 83.0, 73.0, 68.0, 51.0, 53.0, 34.0, 35.0, 22.0, 18.0, 8.0, 9.0, 6.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2464652061462402, -1.21738600730896, -1.1883066892623901, -1.1592274904251099, -1.1301482915878296, -1.1010689735412598, -1.0719897747039795, -1.0429105758666992, -1.013831377029419, -0.9847521185874939, -0.9556729197502136, -0.9265936613082886, -0.8975144624710083, -0.8684352040290833, -0.8393559455871582, -0.8102767467498779, -0.7811974287033081, -0.7521181702613831, -0.7230389714241028, -0.6939597129821777, -0.6648805141448975, -0.6358012557029724, -0.6067219972610474, -0.5776427984237671, -0.5485635995864868, -0.5194843411445618, -0.4904051423072815, -0.46132588386535645, -0.4322466552257538, -0.4031674265861511, -0.37408819794654846, -0.3450089693069458, -0.31592971086502075, -0.2868504822254181, -0.25777125358581543, -0.22869201004505157, -0.19961276650428772, -0.17053353786468506, -0.1414543092250824, -0.11237506568431854, -0.08329583704471588, -0.05421660095453262, -0.025137368589639664, 0.003941863775253296, 0.033021099865436554, 0.06210033595561981, 0.09117956459522247, 0.12025880813598633, 0.149338036775589, 0.17841726541519165, 0.2074965089559555, 0.23657573759555817, 0.265654981136322, 0.2947342097759247, 0.32381343841552734, 0.3528926968574524, 0.38197189569473267, 0.4110511243343353, 0.440130352973938, 0.46920961141586304, 0.4982888400554657, 0.5273680686950684, 0.5564472675323486, 0.5855265259742737, 0.6146057844161987]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 10.0, 8.0, 12.0, 16.0, 15.0, 25.0, 31.0, 68.0, 70.0, 121.0, 161.0, 236.0, 339.0, 607.0, 798.0, 1244.0, 1946.0, 3386.0, 6553.0, 14979.0, 48816.0, 369902.0, 507315.0, 58839.0, 16757.0, 6956.0, 3561.0, 1992.0, 1175.0, 782.0, 574.0, 401.0, 253.0, 181.0, 119.0, 98.0, 54.0, 42.0, 22.0, 24.0, 15.0, 10.0, 11.0, 9.0, 7.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.14306640625, -0.13873863220214844, -0.13441085815429688, -0.1300830841064453, -0.12575531005859375, -0.12142753601074219, -0.11709976196289062, -0.11277198791503906, -0.1084442138671875, -0.10411643981933594, -0.09978866577148438, -0.09546089172363281, -0.09113311767578125, -0.08680534362792969, -0.08247756958007812, -0.07814979553222656, -0.073822021484375, -0.06949424743652344, -0.06516647338867188, -0.06083869934082031, -0.05651092529296875, -0.05218315124511719, -0.047855377197265625, -0.04352760314941406, -0.0391998291015625, -0.03487205505371094, -0.030544281005859375, -0.026216506958007812, -0.02188873291015625, -0.017560958862304688, -0.013233184814453125, -0.008905410766601562, -0.00457763671875, -0.0002498626708984375, 0.004077911376953125, 0.008405685424804688, 0.01273345947265625, 0.017061233520507812, 0.021389007568359375, 0.025716781616210938, 0.0300445556640625, 0.03437232971191406, 0.038700103759765625, 0.04302787780761719, 0.04735565185546875, 0.05168342590332031, 0.056011199951171875, 0.06033897399902344, 0.064666748046875, 0.06899452209472656, 0.07332229614257812, 0.07765007019042969, 0.08197784423828125, 0.08630561828613281, 0.09063339233398438, 0.09496116638183594, 0.0992889404296875, 0.10361671447753906, 0.10794448852539062, 0.11227226257324219, 0.11660003662109375, 0.12092781066894531, 0.12525558471679688, 0.12958335876464844, 0.1339111328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 4.0, 9.0, 10.0, 9.0, 21.0, 31.0, 51.0, 63.0, 93.0, 120.0, 126.0, 135.0, 84.0, 68.0, 41.0, 36.0, 19.0, 12.0, 14.0, 7.0, 9.0, 7.0, 0.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1624755859375, -0.15767860412597656, -0.15288162231445312, -0.1480846405029297, -0.14328765869140625, -0.1384906768798828, -0.13369369506835938, -0.12889671325683594, -0.1240997314453125, -0.11930274963378906, -0.11450576782226562, -0.10970878601074219, -0.10491180419921875, -0.10011482238769531, -0.09531784057617188, -0.09052085876464844, -0.085723876953125, -0.08092689514160156, -0.07612991333007812, -0.07133293151855469, -0.06653594970703125, -0.06173896789550781, -0.056941986083984375, -0.05214500427246094, -0.0473480224609375, -0.04255104064941406, -0.037754058837890625, -0.03295707702636719, -0.02816009521484375, -0.023363113403320312, -0.018566131591796875, -0.013769149780273438, -0.00897216796875, -0.0041751861572265625, 0.000621795654296875, 0.0054187774658203125, 0.01021575927734375, 0.015012741088867188, 0.019809722900390625, 0.024606704711914062, 0.0294036865234375, 0.03420066833496094, 0.038997650146484375, 0.04379463195800781, 0.04859161376953125, 0.05338859558105469, 0.058185577392578125, 0.06298255920410156, 0.067779541015625, 0.07257652282714844, 0.07737350463867188, 0.08217048645019531, 0.08696746826171875, 0.09176445007324219, 0.09656143188476562, 0.10135841369628906, 0.1061553955078125, 0.11095237731933594, 0.11574935913085938, 0.12054634094238281, 0.12534332275390625, 0.1301403045654297, 0.13493728637695312, 0.13973426818847656, 0.14453125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 4.0, 7.0, 9.0, 10.0, 18.0, 26.0, 22.0, 34.0, 55.0, 72.0, 90.0, 138.0, 196.0, 355.0, 653.0, 1594.0, 6604.0, 68235.0, 902051.0, 59182.0, 6059.0, 1476.0, 613.0, 336.0, 204.0, 121.0, 90.0, 80.0, 42.0, 42.0, 32.0, 23.0, 20.0, 15.0, 12.0, 9.0, 9.0, 5.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31982421875, -0.3093299865722656, -0.29883575439453125, -0.2883415222167969, -0.2778472900390625, -0.2673530578613281, -0.25685882568359375, -0.24636459350585938, -0.235870361328125, -0.22537612915039062, -0.21488189697265625, -0.20438766479492188, -0.1938934326171875, -0.18339920043945312, -0.17290496826171875, -0.16241073608398438, -0.15191650390625, -0.14142227172851562, -0.13092803955078125, -0.12043380737304688, -0.1099395751953125, -0.09944534301757812, -0.08895111083984375, -0.07845687866210938, -0.067962646484375, -0.057468414306640625, -0.04697418212890625, -0.036479949951171875, -0.0259857177734375, -0.015491485595703125, -0.00499725341796875, 0.005496978759765625, 0.0159912109375, 0.026485443115234375, 0.03697967529296875, 0.047473907470703125, 0.0579681396484375, 0.06846237182617188, 0.07895660400390625, 0.08945083618164062, 0.099945068359375, 0.11043930053710938, 0.12093353271484375, 0.13142776489257812, 0.1419219970703125, 0.15241622924804688, 0.16291046142578125, 0.17340469360351562, 0.18389892578125, 0.19439315795898438, 0.20488739013671875, 0.21538162231445312, 0.2258758544921875, 0.23637008666992188, 0.24686431884765625, 0.2573585510253906, 0.267852783203125, 0.2783470153808594, 0.28884124755859375, 0.2993354797363281, 0.3098297119140625, 0.3203239440917969, 0.33081817626953125, 0.3413124084472656, 0.351806640625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 6.0, 5.0, 8.0, 14.0, 10.0, 14.0, 13.0, 33.0, 24.0, 37.0, 40.0, 38.0, 45.0, 51.0, 57.0, 57.0, 54.0, 57.0, 33.0, 50.0, 47.0, 44.0, 43.0, 27.0, 36.0, 31.0, 17.0, 19.0, 15.0, 16.0, 8.0, 15.0, 9.0, 8.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36669921875, -0.3547935485839844, -0.34288787841796875, -0.3309822082519531, -0.3190765380859375, -0.3071708679199219, -0.29526519775390625, -0.2833595275878906, -0.271453857421875, -0.2595481872558594, -0.24764251708984375, -0.23573684692382812, -0.2238311767578125, -0.21192550659179688, -0.20001983642578125, -0.18811416625976562, -0.17620849609375, -0.16430282592773438, -0.15239715576171875, -0.14049148559570312, -0.1285858154296875, -0.11668014526367188, -0.10477447509765625, -0.09286880493164062, -0.080963134765625, -0.06905746459960938, -0.05715179443359375, -0.045246124267578125, -0.0333404541015625, -0.021434783935546875, -0.00952911376953125, 0.002376556396484375, 0.0142822265625, 0.026187896728515625, 0.03809356689453125, 0.049999237060546875, 0.0619049072265625, 0.07381057739257812, 0.08571624755859375, 0.09762191772460938, 0.109527587890625, 0.12143325805664062, 0.13333892822265625, 0.14524459838867188, 0.1571502685546875, 0.16905593872070312, 0.18096160888671875, 0.19286727905273438, 0.20477294921875, 0.21667861938476562, 0.22858428955078125, 0.24048995971679688, 0.2523956298828125, 0.2643013000488281, 0.27620697021484375, 0.2881126403808594, 0.300018310546875, 0.3119239807128906, 0.32382965087890625, 0.3357353210449219, 0.3476409912109375, 0.3595466613769531, 0.37145233154296875, 0.3833580017089844, 0.395263671875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 6.0, 2.0, 26.0, 25.0, 69.0, 98.0, 340.0, 1643.0, 24865.0, 1005866.0, 13926.0, 1200.0, 274.0, 91.0, 60.0, 18.0, 25.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.060394287109375, -0.05810880661010742, -0.055823326110839844, -0.053537845611572266, -0.05125236511230469, -0.04896688461303711, -0.04668140411376953, -0.04439592361450195, -0.042110443115234375, -0.0398249626159668, -0.03753948211669922, -0.03525400161743164, -0.03296852111816406, -0.030683040618896484, -0.028397560119628906, -0.026112079620361328, -0.02382659912109375, -0.021541118621826172, -0.019255638122558594, -0.016970157623291016, -0.014684677124023438, -0.01239919662475586, -0.010113716125488281, -0.007828235626220703, -0.005542755126953125, -0.003257274627685547, -0.0009717941284179688, 0.0013136863708496094, 0.0035991668701171875, 0.005884647369384766, 0.008170127868652344, 0.010455608367919922, 0.0127410888671875, 0.015026569366455078, 0.017312049865722656, 0.019597530364990234, 0.021883010864257812, 0.02416849136352539, 0.02645397186279297, 0.028739452362060547, 0.031024932861328125, 0.0333104133605957, 0.03559589385986328, 0.03788137435913086, 0.04016685485839844, 0.042452335357666016, 0.044737815856933594, 0.04702329635620117, 0.04930877685546875, 0.05159425735473633, 0.053879737854003906, 0.056165218353271484, 0.05845069885253906, 0.06073617935180664, 0.06302165985107422, 0.0653071403503418, 0.06759262084960938, 0.06987810134887695, 0.07216358184814453, 0.07444906234741211, 0.07673454284667969, 0.07902002334594727, 0.08130550384521484, 0.08359098434448242, 0.08587646484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 6.0, 17.0, 18.0, 9.0, 30.0, 17.0, 30.0, 35.0, 60.0, 52.0, 51.0, 73.0, 66.0, 72.0, 62.0, 72.0, 58.0, 51.0, 50.0, 34.0, 28.0, 16.0, 19.0, 8.0, 11.0, 9.0, 4.0, 4.0, 7.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.900859832763672e-06, -5.688518285751343e-06, -5.476176738739014e-06, -5.2638351917266846e-06, -5.0514936447143555e-06, -4.839152097702026e-06, -4.626810550689697e-06, -4.414469003677368e-06, -4.202127456665039e-06, -3.98978590965271e-06, -3.777444362640381e-06, -3.5651028156280518e-06, -3.3527612686157227e-06, -3.1404197216033936e-06, -2.9280781745910645e-06, -2.7157366275787354e-06, -2.5033950805664062e-06, -2.291053533554077e-06, -2.078711986541748e-06, -1.866370439529419e-06, -1.6540288925170898e-06, -1.4416873455047607e-06, -1.2293457984924316e-06, -1.0170042514801025e-06, -8.046627044677734e-07, -5.923211574554443e-07, -3.7997961044311523e-07, -1.6763806343078613e-07, 4.470348358154297e-08, 2.5704503059387207e-07, 4.6938657760620117e-07, 6.817281246185303e-07, 8.940696716308594e-07, 1.1064112186431885e-06, 1.3187527656555176e-06, 1.5310943126678467e-06, 1.7434358596801758e-06, 1.955777406692505e-06, 2.168118953704834e-06, 2.380460500717163e-06, 2.592802047729492e-06, 2.8051435947418213e-06, 3.0174851417541504e-06, 3.2298266887664795e-06, 3.4421682357788086e-06, 3.6545097827911377e-06, 3.866851329803467e-06, 4.079192876815796e-06, 4.291534423828125e-06, 4.503875970840454e-06, 4.716217517852783e-06, 4.928559064865112e-06, 5.140900611877441e-06, 5.3532421588897705e-06, 5.5655837059021e-06, 5.777925252914429e-06, 5.990266799926758e-06, 6.202608346939087e-06, 6.414949893951416e-06, 6.627291440963745e-06, 6.839632987976074e-06, 7.051974534988403e-06, 7.264316082000732e-06, 7.4766576290130615e-06, 7.68899917602539e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 8.0, 14.0, 5.0, 13.0, 14.0, 24.0, 25.0, 38.0, 51.0, 93.0, 156.0, 232.0, 366.0, 822.0, 1918.0, 7088.0, 58840.0, 893899.0, 73152.0, 7881.0, 2012.0, 827.0, 372.0, 249.0, 133.0, 96.0, 60.0, 40.0, 30.0, 24.0, 9.0, 12.0, 12.0, 5.0, 3.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.033843994140625, -0.03289151191711426, -0.031939029693603516, -0.030986547470092773, -0.03003406524658203, -0.02908158302307129, -0.028129100799560547, -0.027176618576049805, -0.026224136352539062, -0.02527165412902832, -0.024319171905517578, -0.023366689682006836, -0.022414207458496094, -0.02146172523498535, -0.02050924301147461, -0.019556760787963867, -0.018604278564453125, -0.017651796340942383, -0.01669931411743164, -0.0157468318939209, -0.014794349670410156, -0.013841867446899414, -0.012889385223388672, -0.01193690299987793, -0.010984420776367188, -0.010031938552856445, -0.009079456329345703, -0.008126974105834961, -0.007174491882324219, -0.0062220096588134766, -0.005269527435302734, -0.004317045211791992, -0.00336456298828125, -0.002412080764770508, -0.0014595985412597656, -0.0005071163177490234, 0.00044536590576171875, 0.001397848129272461, 0.002350330352783203, 0.0033028125762939453, 0.0042552947998046875, 0.00520777702331543, 0.006160259246826172, 0.007112741470336914, 0.008065223693847656, 0.009017705917358398, 0.00997018814086914, 0.010922670364379883, 0.011875152587890625, 0.012827634811401367, 0.01378011703491211, 0.014732599258422852, 0.015685081481933594, 0.016637563705444336, 0.017590045928955078, 0.01854252815246582, 0.019495010375976562, 0.020447492599487305, 0.021399974822998047, 0.02235245704650879, 0.02330493927001953, 0.024257421493530273, 0.025209903717041016, 0.026162385940551758, 0.0271148681640625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 6.0, 5.0, 7.0, 3.0, 9.0, 17.0, 23.0, 22.0, 24.0, 31.0, 42.0, 66.0, 66.0, 82.0, 94.0, 82.0, 85.0, 84.0, 60.0, 51.0, 30.0, 20.0, 25.0, 16.0, 13.0, 11.0, 7.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032440185546875, -0.031334877014160156, -0.030229568481445312, -0.02912425994873047, -0.028018951416015625, -0.02691364288330078, -0.025808334350585938, -0.024703025817871094, -0.02359771728515625, -0.022492408752441406, -0.021387100219726562, -0.02028179168701172, -0.019176483154296875, -0.01807117462158203, -0.016965866088867188, -0.015860557556152344, -0.0147552490234375, -0.013649940490722656, -0.012544631958007812, -0.011439323425292969, -0.010334014892578125, -0.009228706359863281, -0.008123397827148438, -0.007018089294433594, -0.00591278076171875, -0.004807472229003906, -0.0037021636962890625, -0.0025968551635742188, -0.001491546630859375, -0.00038623809814453125, 0.0007190704345703125, 0.0018243789672851562, 0.0029296875, 0.004034996032714844, 0.0051403045654296875, 0.006245613098144531, 0.007350921630859375, 0.008456230163574219, 0.009561538696289062, 0.010666847229003906, 0.01177215576171875, 0.012877464294433594, 0.013982772827148438, 0.015088081359863281, 0.016193389892578125, 0.01729869842529297, 0.018404006958007812, 0.019509315490722656, 0.0206146240234375, 0.021719932556152344, 0.022825241088867188, 0.02393054962158203, 0.025035858154296875, 0.02614116668701172, 0.027246475219726562, 0.028351783752441406, 0.02945709228515625, 0.030562400817871094, 0.03166770935058594, 0.03277301788330078, 0.033878326416015625, 0.03498363494873047, 0.03608894348144531, 0.037194252014160156, 0.038299560546875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 14.0, 25.0, 78.0, 380.0, 320.0, 93.0, 38.0, 21.0, 15.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.8871848583221436, -2.819753408432007, -2.75232195854187, -2.6848902702331543, -2.6174588203430176, -2.550027370452881, -2.482595920562744, -2.4151644706726074, -2.3477330207824707, -2.280301570892334, -2.2128701210021973, -2.1454384326934814, -2.0780069828033447, -2.010575532913208, -1.9431440830230713, -1.8757126331329346, -1.8082809448242188, -1.740849494934082, -1.6734179258346558, -1.605986475944519, -1.5385549068450928, -1.471123456954956, -1.4036920070648193, -1.3362605571746826, -1.2688289880752563, -1.2013975381851196, -1.1339659690856934, -1.0665345191955566, -0.9991030097007751, -0.9316715002059937, -0.8642400503158569, -0.7968085408210754, -0.7293767929077148, -0.6619452834129333, -0.5945137739181519, -0.5270823240280151, -0.45965081453323364, -0.39221930503845215, -0.32478782534599304, -0.25735634565353394, -0.18992483615875244, -0.12249334156513214, -0.05506184697151184, 0.01236964762210846, 0.07980114221572876, 0.14723265171051025, 0.21466413140296936, 0.28209561109542847, 0.34952712059020996, 0.41695863008499146, 0.48439010977745056, 0.5518215894699097, 0.6192530989646912, 0.6866846084594727, 0.7541160583496094, 0.8215475678443909, 0.8889790773391724, 0.9564105868339539, 1.0238420963287354, 1.091273546218872, 1.1587049961090088, 1.226136565208435, 1.2935680150985718, 1.360999584197998, 1.4284310340881348]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 4.0, 9.0, 5.0, 11.0, 13.0, 13.0, 14.0, 7.0, 19.0, 20.0, 13.0, 18.0, 26.0, 33.0, 29.0, 41.0, 48.0, 38.0, 44.0, 65.0, 70.0, 65.0, 48.0, 40.0, 41.0, 28.0, 23.0, 25.0, 18.0, 17.0, 17.0, 12.0, 16.0, 13.0, 15.0, 13.0, 11.0, 8.0, 6.0, 5.0, 5.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0], "bins": [-1.2654128074645996, -1.2269556522369385, -1.1884984970092773, -1.1500414609909058, -1.1115843057632446, -1.0731271505355835, -1.034670114517212, -0.9962129592895508, -0.9577558040618896, -0.9192986488342285, -0.8808415532112122, -0.8423844575881958, -0.8039273023605347, -0.7654701471328735, -0.7270130515098572, -0.6885559558868408, -0.6500988006591797, -0.6116416454315186, -0.5731845498085022, -0.5347274541854858, -0.4962702989578247, -0.45781317353248596, -0.4193560481071472, -0.38089892268180847, -0.3424417972564697, -0.303984671831131, -0.26552754640579224, -0.2270704209804535, -0.18861329555511475, -0.150156170129776, -0.11169904470443726, -0.07324191927909851, -0.034784793853759766, 0.0036723315715789795, 0.042129456996917725, 0.08058658242225647, 0.11904370784759521, 0.15750083327293396, 0.1959579586982727, 0.23441508412361145, 0.2728722095489502, 0.31132933497428894, 0.3497864603996277, 0.38824358582496643, 0.4267007112503052, 0.4651578366756439, 0.5036149621009827, 0.542072057723999, 0.5805292129516602, 0.6189863681793213, 0.6574434638023376, 0.695900559425354, 0.7343577146530151, 0.7728148698806763, 0.8112719655036926, 0.849729061126709, 0.8881862163543701, 0.9266433715820312, 0.9651004672050476, 1.003557562828064, 1.042014718055725, 1.0804718732833862, 1.1189289093017578, 1.157386064529419, 1.19584321975708]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 9.0, 5.0, 13.0, 20.0, 26.0, 27.0, 40.0, 65.0, 112.0, 306.0, 1762.0, 13347.0, 150019.0, 3928566.0, 89903.0, 7684.0, 1556.0, 383.0, 155.0, 86.0, 56.0, 39.0, 31.0, 23.0, 13.0, 8.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.16796875, -0.16309356689453125, -0.1582183837890625, -0.15334320068359375, -0.148468017578125, -0.14359283447265625, -0.1387176513671875, -0.13384246826171875, -0.12896728515625, -0.12409210205078125, -0.1192169189453125, -0.11434173583984375, -0.109466552734375, -0.10459136962890625, -0.0997161865234375, -0.09484100341796875, -0.0899658203125, -0.08509063720703125, -0.0802154541015625, -0.07534027099609375, -0.070465087890625, -0.06558990478515625, -0.0607147216796875, -0.05583953857421875, -0.05096435546875, -0.04608917236328125, -0.0412139892578125, -0.03633880615234375, -0.031463623046875, -0.02658843994140625, -0.0217132568359375, -0.01683807373046875, -0.011962890625, -0.00708770751953125, -0.0022125244140625, 0.00266265869140625, 0.007537841796875, 0.01241302490234375, 0.0172882080078125, 0.02216339111328125, 0.02703857421875, 0.03191375732421875, 0.0367889404296875, 0.04166412353515625, 0.046539306640625, 0.05141448974609375, 0.0562896728515625, 0.06116485595703125, 0.0660400390625, 0.07091522216796875, 0.0757904052734375, 0.08066558837890625, 0.085540771484375, 0.09041595458984375, 0.0952911376953125, 0.10016632080078125, 0.10504150390625, 0.10991668701171875, 0.1147918701171875, 0.11966705322265625, 0.124542236328125, 0.12941741943359375, 0.1342926025390625, 0.13916778564453125, 0.14404296875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 15.0, 12.0, 10.0, 24.0, 38.0, 42.0, 62.0, 85.0, 108.0, 134.0, 126.0, 92.0, 66.0, 56.0, 31.0, 18.0, 17.0, 13.0, 11.0, 6.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1610107421875, -0.15625762939453125, -0.1515045166015625, -0.14675140380859375, -0.141998291015625, -0.13724517822265625, -0.1324920654296875, -0.12773895263671875, -0.12298583984375, -0.11823272705078125, -0.1134796142578125, -0.10872650146484375, -0.103973388671875, -0.09922027587890625, -0.0944671630859375, -0.08971405029296875, -0.0849609375, -0.08020782470703125, -0.0754547119140625, -0.07070159912109375, -0.065948486328125, -0.06119537353515625, -0.0564422607421875, -0.05168914794921875, -0.04693603515625, -0.04218292236328125, -0.0374298095703125, -0.03267669677734375, -0.027923583984375, -0.02317047119140625, -0.0184173583984375, -0.01366424560546875, -0.0089111328125, -0.00415802001953125, 0.0005950927734375, 0.00534820556640625, 0.010101318359375, 0.01485443115234375, 0.0196075439453125, 0.02436065673828125, 0.02911376953125, 0.03386688232421875, 0.0386199951171875, 0.04337310791015625, 0.048126220703125, 0.05287933349609375, 0.0576324462890625, 0.06238555908203125, 0.067138671875, 0.07189178466796875, 0.0766448974609375, 0.08139801025390625, 0.086151123046875, 0.09090423583984375, 0.0956573486328125, 0.10041046142578125, 0.10516357421875, 0.10991668701171875, 0.1146697998046875, 0.11942291259765625, 0.124176025390625, 0.12892913818359375, 0.1336822509765625, 0.13843536376953125, 0.1431884765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 9.0, 11.0, 16.0, 34.0, 57.0, 111.0, 264.0, 574.0, 1537.0, 5623.0, 81443.0, 4081643.0, 17692.0, 3381.0, 1078.0, 420.0, 172.0, 91.0, 53.0, 23.0, 15.0, 9.0, 7.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2049560546875, -0.19880104064941406, -0.19264602661132812, -0.1864910125732422, -0.18033599853515625, -0.1741809844970703, -0.16802597045898438, -0.16187095642089844, -0.1557159423828125, -0.14956092834472656, -0.14340591430664062, -0.1372509002685547, -0.13109588623046875, -0.12494087219238281, -0.11878585815429688, -0.11263084411621094, -0.106475830078125, -0.10032081604003906, -0.09416580200195312, -0.08801078796386719, -0.08185577392578125, -0.07570075988769531, -0.06954574584960938, -0.06339073181152344, -0.0572357177734375, -0.05108070373535156, -0.044925689697265625, -0.03877067565917969, -0.03261566162109375, -0.026460647583007812, -0.020305633544921875, -0.014150619506835938, -0.00799560546875, -0.0018405914306640625, 0.004314422607421875, 0.010469436645507812, 0.01662445068359375, 0.022779464721679688, 0.028934478759765625, 0.03508949279785156, 0.0412445068359375, 0.04739952087402344, 0.053554534912109375, 0.05970954895019531, 0.06586456298828125, 0.07201957702636719, 0.07817459106445312, 0.08432960510253906, 0.090484619140625, 0.09663963317871094, 0.10279464721679688, 0.10894966125488281, 0.11510467529296875, 0.12125968933105469, 0.12741470336914062, 0.13356971740722656, 0.1397247314453125, 0.14587974548339844, 0.15203475952148438, 0.1581897735595703, 0.16434478759765625, 0.1704998016357422, 0.17665481567382812, 0.18280982971191406, 0.18896484375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 3.0, 8.0, 23.0, 43.0, 138.0, 647.0, 1945.0, 870.0, 262.0, 71.0, 19.0, 5.0, 6.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1947021484375, -0.18852996826171875, -0.1823577880859375, -0.17618560791015625, -0.170013427734375, -0.16384124755859375, -0.1576690673828125, -0.15149688720703125, -0.14532470703125, -0.13915252685546875, -0.1329803466796875, -0.12680816650390625, -0.120635986328125, -0.11446380615234375, -0.1082916259765625, -0.10211944580078125, -0.095947265625, -0.08977508544921875, -0.0836029052734375, -0.07743072509765625, -0.071258544921875, -0.06508636474609375, -0.0589141845703125, -0.05274200439453125, -0.04656982421875, -0.04039764404296875, -0.0342254638671875, -0.02805328369140625, -0.021881103515625, -0.01570892333984375, -0.0095367431640625, -0.00336456298828125, 0.0028076171875, 0.00897979736328125, 0.0151519775390625, 0.02132415771484375, 0.027496337890625, 0.03366851806640625, 0.0398406982421875, 0.04601287841796875, 0.05218505859375, 0.05835723876953125, 0.0645294189453125, 0.07070159912109375, 0.076873779296875, 0.08304595947265625, 0.0892181396484375, 0.09539031982421875, 0.1015625, 0.10773468017578125, 0.1139068603515625, 0.12007904052734375, 0.126251220703125, 0.13242340087890625, 0.1385955810546875, 0.14476776123046875, 0.15093994140625, 0.15711212158203125, 0.1632843017578125, 0.16945648193359375, 0.175628662109375, 0.18180084228515625, 0.1879730224609375, 0.19414520263671875, 0.2003173828125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 5.0, 5.0, 11.0, 34.0, 86.0, 434.0, 362.0, 37.0, 19.0, 8.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.0233511924743652, -1.982079029083252, -1.9408068656921387, -1.8995347023010254, -1.858262538909912, -1.8169903755187988, -1.7757182121276855, -1.7344460487365723, -1.693173885345459, -1.6519017219543457, -1.6106295585632324, -1.5693573951721191, -1.5280852317810059, -1.4868130683898926, -1.4455409049987793, -1.404268741607666, -1.3629964590072632, -1.32172429561615, -1.2804521322250366, -1.2391799688339233, -1.19790780544281, -1.1566356420516968, -1.1153634786605835, -1.0740911960601807, -1.0328190326690674, -0.9915468692779541, -0.9502747058868408, -0.9090025424957275, -0.8677303791046143, -0.826458215713501, -0.7851859927177429, -0.7439138293266296, -0.7026417255401611, -0.6613695621490479, -0.6200973987579346, -0.5788252353668213, -0.537553071975708, -0.49628087878227234, -0.45500868558883667, -0.4137365221977234, -0.3724643588066101, -0.3311921954154968, -0.28992003202438354, -0.24864783883094788, -0.2073756754398346, -0.1661035120487213, -0.12483133375644684, -0.08355915546417236, -0.04228699207305908, -0.0010148212313652039, 0.040257349610328674, 0.08152952045202255, 0.12280169129371643, 0.1640738546848297, 0.2053460329771042, 0.24661821126937866, 0.28789037466049194, 0.3291625380516052, 0.3704347014427185, 0.4117068946361542, 0.45297905802726746, 0.49425122141838074, 0.5355234146118164, 0.5767955780029297, 0.618067741394043]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 11.0, 4.0, 9.0, 23.0, 16.0, 23.0, 38.0, 37.0, 41.0, 57.0, 44.0, 57.0, 78.0, 67.0, 65.0, 63.0, 63.0, 54.0, 36.0, 30.0, 42.0, 35.0, 19.0, 26.0, 16.0, 13.0, 5.0, 5.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7429162263870239, -0.7242664694786072, -0.7056167125701904, -0.6869669556617737, -0.6683171987533569, -0.649667501449585, -0.6310176849365234, -0.6123679876327515, -0.5937182307243347, -0.575068473815918, -0.5564187169075012, -0.5377689599990845, -0.5191192030906677, -0.500469446182251, -0.4818197190761566, -0.46316999197006226, -0.4445202052593231, -0.42587044835090637, -0.4072206914424896, -0.38857096433639526, -0.3699212074279785, -0.35127145051956177, -0.332621693611145, -0.31397193670272827, -0.2953221797943115, -0.2766724228858948, -0.258022665977478, -0.23937292397022247, -0.22072318196296692, -0.20207342505455017, -0.18342366814613342, -0.16477392613887787, -0.14612418413162231, -0.12747442722320557, -0.10882468521595001, -0.09017492830753326, -0.07152517884969711, -0.05287542939186096, -0.034225672483444214, -0.01557593047618866, 0.0030738264322280884, 0.02172357775270939, 0.04037332907319069, 0.05902308225631714, 0.07767283171415329, 0.09632258117198944, 0.11497233808040619, 0.13362208008766174, 0.1522718369960785, 0.17092159390449524, 0.1895713359117508, 0.20822109282016754, 0.2268708348274231, 0.24552059173583984, 0.2641703486442566, 0.28282010555267334, 0.3014698624610901, 0.32011961936950684, 0.3387693762779236, 0.35741913318634033, 0.3760688602924347, 0.39471861720085144, 0.4133683741092682, 0.43201810121536255, 0.4506678581237793]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 7.0, 12.0, 19.0, 16.0, 26.0, 47.0, 45.0, 89.0, 117.0, 162.0, 231.0, 323.0, 487.0, 706.0, 1011.0, 1492.0, 2554.0, 4833.0, 9496.0, 24262.0, 84841.0, 520330.0, 305340.0, 55809.0, 17995.0, 7852.0, 4009.0, 2164.0, 1355.0, 894.0, 601.0, 397.0, 286.0, 215.0, 136.0, 102.0, 85.0, 62.0, 34.0, 29.0, 21.0, 11.0, 13.0, 8.0, 5.0, 3.0, 7.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.091552734375, -0.08876609802246094, -0.08597946166992188, -0.08319282531738281, -0.08040618896484375, -0.07761955261230469, -0.07483291625976562, -0.07204627990722656, -0.0692596435546875, -0.06647300720214844, -0.06368637084960938, -0.06089973449707031, -0.05811309814453125, -0.05532646179199219, -0.052539825439453125, -0.04975318908691406, -0.046966552734375, -0.04417991638183594, -0.041393280029296875, -0.03860664367675781, -0.03582000732421875, -0.03303337097167969, -0.030246734619140625, -0.027460098266601562, -0.0246734619140625, -0.021886825561523438, -0.019100189208984375, -0.016313552856445312, -0.01352691650390625, -0.010740280151367188, -0.007953643798828125, -0.0051670074462890625, -0.00238037109375, 0.0004062652587890625, 0.003192901611328125, 0.0059795379638671875, 0.00876617431640625, 0.011552810668945312, 0.014339447021484375, 0.017126083374023438, 0.0199127197265625, 0.022699356079101562, 0.025485992431640625, 0.028272628784179688, 0.03105926513671875, 0.03384590148925781, 0.036632537841796875, 0.03941917419433594, 0.042205810546875, 0.04499244689941406, 0.047779083251953125, 0.05056571960449219, 0.05335235595703125, 0.05613899230957031, 0.058925628662109375, 0.06171226501464844, 0.0644989013671875, 0.06728553771972656, 0.07007217407226562, 0.07285881042480469, 0.07564544677734375, 0.07843208312988281, 0.08121871948242188, 0.08400535583496094, 0.0867919921875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 9.0, 17.0, 10.0, 29.0, 36.0, 51.0, 67.0, 100.0, 109.0, 141.0, 109.0, 95.0, 62.0, 42.0, 29.0, 18.0, 15.0, 10.0, 10.0, 4.0, 7.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1607666015625, -0.15611839294433594, -0.15147018432617188, -0.1468219757080078, -0.14217376708984375, -0.1375255584716797, -0.13287734985351562, -0.12822914123535156, -0.1235809326171875, -0.11893272399902344, -0.11428451538085938, -0.10963630676269531, -0.10498809814453125, -0.10033988952636719, -0.09569168090820312, -0.09104347229003906, -0.086395263671875, -0.08174705505371094, -0.07709884643554688, -0.07245063781738281, -0.06780242919921875, -0.06315422058105469, -0.058506011962890625, -0.05385780334472656, -0.0492095947265625, -0.04456138610839844, -0.039913177490234375, -0.03526496887207031, -0.03061676025390625, -0.025968551635742188, -0.021320343017578125, -0.016672134399414062, -0.01202392578125, -0.0073757171630859375, -0.002727508544921875, 0.0019207000732421875, 0.00656890869140625, 0.011217117309570312, 0.015865325927734375, 0.020513534545898438, 0.0251617431640625, 0.029809951782226562, 0.034458160400390625, 0.03910636901855469, 0.04375457763671875, 0.04840278625488281, 0.053050994873046875, 0.05769920349121094, 0.062347412109375, 0.06699562072753906, 0.07164382934570312, 0.07629203796386719, 0.08094024658203125, 0.08558845520019531, 0.09023666381835938, 0.09488487243652344, 0.0995330810546875, 0.10418128967285156, 0.10882949829101562, 0.11347770690917969, 0.11812591552734375, 0.12277412414550781, 0.12742233276367188, 0.13207054138183594, 0.13671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 12.0, 19.0, 15.0, 24.0, 55.0, 82.0, 143.0, 223.0, 441.0, 840.0, 2140.0, 6210.0, 23209.0, 138905.0, 745259.0, 103875.0, 18679.0, 4980.0, 1789.0, 765.0, 379.0, 209.0, 113.0, 72.0, 34.0, 23.0, 21.0, 12.0, 5.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155517578125, -0.1510009765625, -0.146484375, -0.1419677734375, -0.137451171875, -0.1329345703125, -0.12841796875, -0.1239013671875, -0.119384765625, -0.1148681640625, -0.1103515625, -0.1058349609375, -0.101318359375, -0.0968017578125, -0.09228515625, -0.0877685546875, -0.083251953125, -0.0787353515625, -0.07421875, -0.0697021484375, -0.065185546875, -0.0606689453125, -0.05615234375, -0.0516357421875, -0.047119140625, -0.0426025390625, -0.0380859375, -0.0335693359375, -0.029052734375, -0.0245361328125, -0.02001953125, -0.0155029296875, -0.010986328125, -0.0064697265625, -0.001953125, 0.0025634765625, 0.007080078125, 0.0115966796875, 0.01611328125, 0.0206298828125, 0.025146484375, 0.0296630859375, 0.0341796875, 0.0386962890625, 0.043212890625, 0.0477294921875, 0.05224609375, 0.0567626953125, 0.061279296875, 0.0657958984375, 0.0703125, 0.0748291015625, 0.079345703125, 0.0838623046875, 0.08837890625, 0.0928955078125, 0.097412109375, 0.1019287109375, 0.1064453125, 0.1109619140625, 0.115478515625, 0.1199951171875, 0.12451171875, 0.1290283203125, 0.133544921875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 8.0, 13.0, 15.0, 18.0, 16.0, 30.0, 43.0, 47.0, 55.0, 54.0, 56.0, 68.0, 59.0, 82.0, 60.0, 68.0, 55.0, 46.0, 48.0, 37.0, 30.0, 29.0, 14.0, 17.0, 6.0, 4.0, 4.0, 9.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3515625, -0.3378143310546875, -0.324066162109375, -0.3103179931640625, -0.29656982421875, -0.2828216552734375, -0.269073486328125, -0.2553253173828125, -0.2415771484375, -0.2278289794921875, -0.214080810546875, -0.2003326416015625, -0.18658447265625, -0.1728363037109375, -0.159088134765625, -0.1453399658203125, -0.131591796875, -0.1178436279296875, -0.104095458984375, -0.0903472900390625, -0.07659912109375, -0.0628509521484375, -0.049102783203125, -0.0353546142578125, -0.0216064453125, -0.0078582763671875, 0.005889892578125, 0.0196380615234375, 0.03338623046875, 0.0471343994140625, 0.060882568359375, 0.0746307373046875, 0.08837890625, 0.1021270751953125, 0.115875244140625, 0.1296234130859375, 0.14337158203125, 0.1571197509765625, 0.170867919921875, 0.1846160888671875, 0.1983642578125, 0.2121124267578125, 0.225860595703125, 0.2396087646484375, 0.25335693359375, 0.2671051025390625, 0.280853271484375, 0.2946014404296875, 0.308349609375, 0.3220977783203125, 0.335845947265625, 0.3495941162109375, 0.36334228515625, 0.3770904541015625, 0.390838623046875, 0.4045867919921875, 0.4183349609375, 0.4320831298828125, 0.445831298828125, 0.4595794677734375, 0.47332763671875, 0.4870758056640625, 0.500823974609375, 0.5145721435546875, 0.5283203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 9.0, 12.0, 16.0, 17.0, 29.0, 38.0, 69.0, 101.0, 181.0, 297.0, 532.0, 1058.0, 2205.0, 6141.0, 22417.0, 144501.0, 744439.0, 100077.0, 17252.0, 5076.0, 1989.0, 887.0, 442.0, 293.0, 166.0, 94.0, 59.0, 37.0, 31.0, 24.0, 16.0, 7.0, 9.0, 5.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.01537322998046875, -0.014883875846862793, -0.014394521713256836, -0.013905167579650879, -0.013415813446044922, -0.012926459312438965, -0.012437105178833008, -0.01194775104522705, -0.011458396911621094, -0.010969042778015137, -0.01047968864440918, -0.009990334510803223, -0.009500980377197266, -0.009011626243591309, -0.008522272109985352, -0.008032917976379395, -0.0075435638427734375, -0.0070542097091674805, -0.0065648555755615234, -0.006075501441955566, -0.005586147308349609, -0.005096793174743652, -0.004607439041137695, -0.004118084907531738, -0.0036287307739257812, -0.0031393766403198242, -0.002650022506713867, -0.00216066837310791, -0.0016713142395019531, -0.001181960105895996, -0.0006926059722900391, -0.00020325183868408203, 0.000286102294921875, 0.000775456428527832, 0.001264810562133789, 0.001754164695739746, 0.002243518829345703, 0.00273287296295166, 0.003222227096557617, 0.0037115812301635742, 0.004200935363769531, 0.004690289497375488, 0.005179643630981445, 0.005668997764587402, 0.006158351898193359, 0.006647706031799316, 0.0071370601654052734, 0.0076264142990112305, 0.008115768432617188, 0.008605122566223145, 0.009094476699829102, 0.009583830833435059, 0.010073184967041016, 0.010562539100646973, 0.01105189323425293, 0.011541247367858887, 0.012030601501464844, 0.0125199556350708, 0.013009309768676758, 0.013498663902282715, 0.013988018035888672, 0.014477372169494629, 0.014966726303100586, 0.015456080436706543, 0.0159454345703125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 1.0, 8.0, 7.0, 7.0, 17.0, 17.0, 20.0, 28.0, 20.0, 41.0, 33.0, 75.0, 56.0, 31.0, 83.0, 66.0, 66.0, 77.0, 59.0, 37.0, 46.0, 34.0, 40.0, 29.0, 20.0, 24.0, 18.0, 14.0, 9.0, 0.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.662441253662109e-06, -5.494803190231323e-06, -5.327165126800537e-06, -5.159527063369751e-06, -4.991888999938965e-06, -4.824250936508179e-06, -4.656612873077393e-06, -4.4889748096466064e-06, -4.32133674621582e-06, -4.153698682785034e-06, -3.986060619354248e-06, -3.818422555923462e-06, -3.6507844924926758e-06, -3.4831464290618896e-06, -3.3155083656311035e-06, -3.1478703022003174e-06, -2.9802322387695312e-06, -2.812594175338745e-06, -2.644956111907959e-06, -2.477318048477173e-06, -2.3096799850463867e-06, -2.1420419216156006e-06, -1.9744038581848145e-06, -1.8067657947540283e-06, -1.6391277313232422e-06, -1.471489667892456e-06, -1.30385160446167e-06, -1.1362135410308838e-06, -9.685754776000977e-07, -8.009374141693115e-07, -6.332993507385254e-07, -4.6566128730773926e-07, -2.980232238769531e-07, -1.30385160446167e-07, 3.725290298461914e-08, 2.0489096641540527e-07, 3.725290298461914e-07, 5.401670932769775e-07, 7.078051567077637e-07, 8.754432201385498e-07, 1.043081283569336e-06, 1.210719347000122e-06, 1.3783574104309082e-06, 1.5459954738616943e-06, 1.7136335372924805e-06, 1.8812716007232666e-06, 2.0489096641540527e-06, 2.216547727584839e-06, 2.384185791015625e-06, 2.551823854446411e-06, 2.7194619178771973e-06, 2.8870999813079834e-06, 3.0547380447387695e-06, 3.2223761081695557e-06, 3.390014171600342e-06, 3.557652235031128e-06, 3.725290298461914e-06, 3.8929283618927e-06, 4.060566425323486e-06, 4.2282044887542725e-06, 4.395842552185059e-06, 4.563480615615845e-06, 4.731118679046631e-06, 4.898756742477417e-06, 5.066394805908203e-06]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 8.0, 14.0, 18.0, 33.0, 38.0, 75.0, 112.0, 201.0, 440.0, 881.0, 2228.0, 8007.0, 53986.0, 739320.0, 216124.0, 20121.0, 4176.0, 1392.0, 613.0, 319.0, 155.0, 100.0, 73.0, 35.0, 31.0, 19.0, 11.0, 8.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169219970703125, -0.016312599182128906, -0.015703201293945312, -0.015093803405761719, -0.014484405517578125, -0.013875007629394531, -0.013265609741210938, -0.012656211853027344, -0.01204681396484375, -0.011437416076660156, -0.010828018188476562, -0.010218620300292969, -0.009609222412109375, -0.008999824523925781, -0.008390426635742188, -0.007781028747558594, -0.007171630859375, -0.006562232971191406, -0.0059528350830078125, -0.005343437194824219, -0.004734039306640625, -0.004124641418457031, -0.0035152435302734375, -0.0029058456420898438, -0.00229644775390625, -0.0016870498657226562, -0.0010776519775390625, -0.00046825408935546875, 0.000141143798828125, 0.0007505416870117188, 0.0013599395751953125, 0.0019693374633789062, 0.0025787353515625, 0.0031881332397460938, 0.0037975311279296875, 0.004406929016113281, 0.005016326904296875, 0.005625724792480469, 0.0062351226806640625, 0.006844520568847656, 0.00745391845703125, 0.008063316345214844, 0.008672714233398438, 0.009282112121582031, 0.009891510009765625, 0.010500907897949219, 0.011110305786132812, 0.011719703674316406, 0.0123291015625, 0.012938499450683594, 0.013547897338867188, 0.014157295227050781, 0.014766693115234375, 0.015376091003417969, 0.015985488891601562, 0.016594886779785156, 0.01720428466796875, 0.017813682556152344, 0.018423080444335938, 0.01903247833251953, 0.019641876220703125, 0.02025127410888672, 0.020860671997070312, 0.021470069885253906, 0.0220794677734375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 10.0, 9.0, 10.0, 17.0, 27.0, 40.0, 67.0, 101.0, 125.0, 144.0, 144.0, 103.0, 66.0, 55.0, 39.0, 18.0, 16.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060760498046875, -0.059006690979003906, -0.05725288391113281, -0.05549907684326172, -0.053745269775390625, -0.05199146270751953, -0.05023765563964844, -0.048483848571777344, -0.04673004150390625, -0.044976234436035156, -0.04322242736816406, -0.04146862030029297, -0.039714813232421875, -0.03796100616455078, -0.03620719909667969, -0.034453392028808594, -0.0326995849609375, -0.030945777893066406, -0.029191970825195312, -0.02743816375732422, -0.025684356689453125, -0.02393054962158203, -0.022176742553710938, -0.020422935485839844, -0.01866912841796875, -0.016915321350097656, -0.015161514282226562, -0.013407707214355469, -0.011653900146484375, -0.009900093078613281, -0.008146286010742188, -0.006392478942871094, -0.004638671875, -0.0028848648071289062, -0.0011310577392578125, 0.0006227493286132812, 0.002376556396484375, 0.004130363464355469, 0.0058841705322265625, 0.007637977600097656, 0.00939178466796875, 0.011145591735839844, 0.012899398803710938, 0.014653205871582031, 0.016407012939453125, 0.01816082000732422, 0.019914627075195312, 0.021668434143066406, 0.0234222412109375, 0.025176048278808594, 0.026929855346679688, 0.02868366241455078, 0.030437469482421875, 0.03219127655029297, 0.03394508361816406, 0.035698890686035156, 0.03745269775390625, 0.039206504821777344, 0.04096031188964844, 0.04271411895751953, 0.044467926025390625, 0.04622173309326172, 0.04797554016113281, 0.049729347229003906, 0.051483154296875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 8.0, 9.0, 12.0, 29.0, 55.0, 129.0, 324.0, 225.0, 87.0, 44.0, 36.0, 16.0, 8.0, 11.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1084856986999512, -1.0734870433807373, -1.0384883880615234, -1.00348961353302, -0.9684909582138062, -0.9334923028945923, -0.8984935879707336, -0.863494873046875, -0.8284962177276611, -0.7934975624084473, -0.7584988474845886, -0.72350013256073, -0.6885014772415161, -0.6535028219223022, -0.6185041069984436, -0.583505392074585, -0.5485067367553711, -0.5135080814361572, -0.4785093665122986, -0.44351068139076233, -0.4085119962692261, -0.3735133111476898, -0.33851462602615356, -0.3035159409046173, -0.26851725578308105, -0.2335185706615448, -0.19851988554000854, -0.1635212004184723, -0.12852251529693604, -0.09352383017539978, -0.058525145053863525, -0.02352645993232727, 0.011472344398498535, 0.04647102952003479, 0.08146971464157104, 0.1164683997631073, 0.15146708488464355, 0.1864657700061798, 0.22146445512771606, 0.2564631402492523, 0.2914618253707886, 0.32646051049232483, 0.3614591956138611, 0.39645788073539734, 0.4314565658569336, 0.46645525097846985, 0.5014539361000061, 0.5364526510238647, 0.5714513063430786, 0.6064499616622925, 0.6414486765861511, 0.6764473915100098, 0.7114460468292236, 0.7464447021484375, 0.7814434170722961, 0.8164421319961548, 0.8514407873153687, 0.8864394426345825, 0.9214381575584412, 0.9564368724822998, 0.9914355278015137, 1.0264341831207275, 1.0614328384399414, 1.0964316129684448, 1.1314302682876587]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 9.0, 6.0, 6.0, 20.0, 14.0, 20.0, 20.0, 21.0, 21.0, 24.0, 27.0, 31.0, 31.0, 36.0, 54.0, 68.0, 69.0, 91.0, 70.0, 51.0, 51.0, 34.0, 22.0, 36.0, 32.0, 31.0, 18.0, 16.0, 15.0, 10.0, 13.0, 10.0, 5.0, 4.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3760905265808105, -1.3369120359420776, -1.2977335453033447, -1.2585549354553223, -1.2193764448165894, -1.1801979541778564, -1.1410194635391235, -1.1018409729003906, -1.0626623630523682, -1.0234838724136353, -0.9843053221702576, -0.9451268315315247, -0.905948281288147, -0.8667697906494141, -0.8275913000106812, -0.7884128093719482, -0.7492343187332153, -0.7100558280944824, -0.6708772778511047, -0.6316987872123718, -0.5925202369689941, -0.5533417463302612, -0.5141632556915283, -0.474984735250473, -0.4358062148094177, -0.3966276943683624, -0.35744917392730713, -0.3182706832885742, -0.2790921628475189, -0.23991364240646362, -0.20073513686656952, -0.16155663132667542, -0.12237799167633057, -0.08319947868585587, -0.044020965695381165, -0.004842452704906464, 0.03433606028556824, 0.07351458072662354, 0.11269308626651764, 0.15187159180641174, 0.19105011224746704, 0.23022863268852234, 0.26940715312957764, 0.30858564376831055, 0.34776416420936584, 0.38694268465042114, 0.42612117528915405, 0.46529969573020935, 0.5044782161712646, 0.5436567068099976, 0.5828352570533752, 0.6220137476921082, 0.6611922979354858, 0.7003707885742188, 0.7395492792129517, 0.7787277698516846, 0.8179063200950623, 0.8570848107337952, 0.8962633609771729, 0.9354418516159058, 0.9746203422546387, 1.0137989521026611, 1.052977442741394, 1.092155933380127, 1.1313344240188599]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 6.0, 4.0, 8.0, 13.0, 25.0, 46.0, 105.0, 197.0, 440.0, 949.0, 1833.0, 3984.0, 7818.0, 17834.0, 52772.0, 214626.0, 2094987.0, 1567927.0, 172010.0, 36608.0, 10819.0, 4697.0, 2661.0, 1619.0, 989.0, 578.0, 323.0, 170.0, 105.0, 63.0, 28.0, 14.0, 6.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0438232421875, -0.042359352111816406, -0.04089546203613281, -0.03943157196044922, -0.037967681884765625, -0.03650379180908203, -0.03503990173339844, -0.033576011657714844, -0.03211212158203125, -0.030648231506347656, -0.029184341430664062, -0.02772045135498047, -0.026256561279296875, -0.02479267120361328, -0.023328781127929688, -0.021864891052246094, -0.0204010009765625, -0.018937110900878906, -0.017473220825195312, -0.01600933074951172, -0.014545440673828125, -0.013081550598144531, -0.011617660522460938, -0.010153770446777344, -0.00868988037109375, -0.007225990295410156, -0.0057621002197265625, -0.004298210144042969, -0.002834320068359375, -0.0013704299926757812, 9.34600830078125e-05, 0.0015573501586914062, 0.003021240234375, 0.004485130310058594, 0.0059490203857421875, 0.007412910461425781, 0.008876800537109375, 0.010340690612792969, 0.011804580688476562, 0.013268470764160156, 0.01473236083984375, 0.016196250915527344, 0.017660140991210938, 0.01912403106689453, 0.020587921142578125, 0.02205181121826172, 0.023515701293945312, 0.024979591369628906, 0.0264434814453125, 0.027907371520996094, 0.029371261596679688, 0.03083515167236328, 0.032299041748046875, 0.03376293182373047, 0.03522682189941406, 0.036690711975097656, 0.03815460205078125, 0.039618492126464844, 0.04108238220214844, 0.04254627227783203, 0.044010162353515625, 0.04547405242919922, 0.04693794250488281, 0.048401832580566406, 0.04986572265625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 8.0, 14.0, 22.0, 31.0, 38.0, 48.0, 77.0, 89.0, 103.0, 116.0, 111.0, 76.0, 62.0, 59.0, 32.0, 21.0, 29.0, 17.0, 9.0, 5.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.158203125, -0.1536407470703125, -0.149078369140625, -0.1445159912109375, -0.13995361328125, -0.1353912353515625, -0.130828857421875, -0.1262664794921875, -0.1217041015625, -0.1171417236328125, -0.112579345703125, -0.1080169677734375, -0.10345458984375, -0.0988922119140625, -0.094329833984375, -0.0897674560546875, -0.085205078125, -0.0806427001953125, -0.076080322265625, -0.0715179443359375, -0.06695556640625, -0.0623931884765625, -0.057830810546875, -0.0532684326171875, -0.0487060546875, -0.0441436767578125, -0.039581298828125, -0.0350189208984375, -0.03045654296875, -0.0258941650390625, -0.021331787109375, -0.0167694091796875, -0.01220703125, -0.0076446533203125, -0.003082275390625, 0.0014801025390625, 0.00604248046875, 0.0106048583984375, 0.015167236328125, 0.0197296142578125, 0.0242919921875, 0.0288543701171875, 0.033416748046875, 0.0379791259765625, 0.04254150390625, 0.0471038818359375, 0.051666259765625, 0.0562286376953125, 0.060791015625, 0.0653533935546875, 0.069915771484375, 0.0744781494140625, 0.07904052734375, 0.0836029052734375, 0.088165283203125, 0.0927276611328125, 0.0972900390625, 0.1018524169921875, 0.106414794921875, 0.1109771728515625, 0.11553955078125, 0.1201019287109375, 0.124664306640625, 0.1292266845703125, 0.1337890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 7.0, 13.0, 33.0, 94.0, 297.0, 1227.0, 6403.0, 2466756.0, 1711676.0, 6143.0, 1146.0, 293.0, 80.0, 38.0, 22.0, 14.0, 8.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2183837890625, -0.21155738830566406, -0.20473098754882812, -0.1979045867919922, -0.19107818603515625, -0.1842517852783203, -0.17742538452148438, -0.17059898376464844, -0.1637725830078125, -0.15694618225097656, -0.15011978149414062, -0.1432933807373047, -0.13646697998046875, -0.1296405792236328, -0.12281417846679688, -0.11598777770996094, -0.109161376953125, -0.10233497619628906, -0.09550857543945312, -0.08868217468261719, -0.08185577392578125, -0.07502937316894531, -0.06820297241210938, -0.06137657165527344, -0.0545501708984375, -0.04772377014160156, -0.040897369384765625, -0.03407096862792969, -0.02724456787109375, -0.020418167114257812, -0.013591766357421875, -0.0067653656005859375, 6.103515625e-05, 0.0068874359130859375, 0.013713836669921875, 0.020540237426757812, 0.02736663818359375, 0.03419303894042969, 0.041019439697265625, 0.04784584045410156, 0.0546722412109375, 0.06149864196777344, 0.06832504272460938, 0.07515144348144531, 0.08197784423828125, 0.08880424499511719, 0.09563064575195312, 0.10245704650878906, 0.109283447265625, 0.11610984802246094, 0.12293624877929688, 0.1297626495361328, 0.13658905029296875, 0.1434154510498047, 0.15024185180664062, 0.15706825256347656, 0.1638946533203125, 0.17072105407714844, 0.17754745483398438, 0.1843738555908203, 0.19120025634765625, 0.1980266571044922, 0.20485305786132812, 0.21167945861816406, 0.218505859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 5.0, 9.0, 6.0, 21.0, 47.0, 92.0, 219.0, 687.0, 1447.0, 880.0, 388.0, 132.0, 63.0, 24.0, 9.0, 12.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1251220703125, -0.12114906311035156, -0.11717605590820312, -0.11320304870605469, -0.10923004150390625, -0.10525703430175781, -0.10128402709960938, -0.09731101989746094, -0.0933380126953125, -0.08936500549316406, -0.08539199829101562, -0.08141899108886719, -0.07744598388671875, -0.07347297668457031, -0.06949996948242188, -0.06552696228027344, -0.061553955078125, -0.05758094787597656, -0.053607940673828125, -0.04963493347167969, -0.04566192626953125, -0.04168891906738281, -0.037715911865234375, -0.03374290466308594, -0.0297698974609375, -0.025796890258789062, -0.021823883056640625, -0.017850875854492188, -0.01387786865234375, -0.009904861450195312, -0.005931854248046875, -0.0019588470458984375, 0.00201416015625, 0.0059871673583984375, 0.009960174560546875, 0.013933181762695312, 0.01790618896484375, 0.021879196166992188, 0.025852203369140625, 0.029825210571289062, 0.0337982177734375, 0.03777122497558594, 0.041744232177734375, 0.04571723937988281, 0.04969024658203125, 0.05366325378417969, 0.057636260986328125, 0.06160926818847656, 0.065582275390625, 0.06955528259277344, 0.07352828979492188, 0.07750129699707031, 0.08147430419921875, 0.08544731140136719, 0.08942031860351562, 0.09339332580566406, 0.0973663330078125, 0.10133934020996094, 0.10531234741210938, 0.10928535461425781, 0.11325836181640625, 0.11723136901855469, 0.12120437622070312, 0.12517738342285156, 0.129150390625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 3.0, 5.0, 11.0, 21.0, 21.0, 42.0, 82.0, 180.0, 323.0, 211.0, 65.0, 20.0, 8.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.834306538105011, -0.8127552270889282, -0.7912038564682007, -0.7696525454521179, -0.7481011748313904, -0.7265498638153076, -0.7049984931945801, -0.6834471821784973, -0.6618958711624146, -0.6403445601463318, -0.6187931895256042, -0.5972418785095215, -0.575690507888794, -0.5541391968727112, -0.5325878858566284, -0.5110365152359009, -0.48948514461517334, -0.4679338037967682, -0.44638246297836304, -0.4248311519622803, -0.40327978134155273, -0.38172847032546997, -0.3601771295070648, -0.33862578868865967, -0.3170744478702545, -0.29552310705184937, -0.2739717662334442, -0.25242042541503906, -0.2308690994977951, -0.20931775867938995, -0.187766432762146, -0.16621509194374084, -0.14466369152069092, -0.12311235070228577, -0.10156101733446121, -0.08000968396663666, -0.058458343148231506, -0.036907002329826355, -0.015355676412582397, 0.006195664405822754, 0.027747005224227905, 0.04929834231734276, 0.07084967941045761, 0.09240101277828217, 0.11395235359668732, 0.13550369441509247, 0.15705502033233643, 0.17860636115074158, 0.20015770196914673, 0.22170904278755188, 0.24326038360595703, 0.2648116946220398, 0.28636306524276733, 0.3079143762588501, 0.32946571707725525, 0.3510170578956604, 0.37256839871406555, 0.3941197395324707, 0.41567108035087585, 0.437222421169281, 0.45877373218536377, 0.4803251028060913, 0.5018764138221741, 0.5234277248382568, 0.5449790954589844]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 3.0, 4.0, 7.0, 6.0, 7.0, 9.0, 18.0, 9.0, 24.0, 29.0, 29.0, 35.0, 22.0, 24.0, 30.0, 30.0, 41.0, 48.0, 39.0, 35.0, 23.0, 41.0, 45.0, 31.0, 33.0, 26.0, 28.0, 29.0, 31.0, 26.0, 22.0, 25.0, 21.0, 22.0, 23.0, 22.0, 16.0, 12.0, 17.0, 11.0, 11.0, 10.0, 9.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0], "bins": [-0.39157378673553467, -0.3801146447658539, -0.3686555325984955, -0.3571963906288147, -0.3457372486591339, -0.3342781364917755, -0.3228189945220947, -0.31135988235473633, -0.29990074038505554, -0.28844159841537476, -0.27698248624801636, -0.26552334427833557, -0.2540642023086548, -0.2426050901412964, -0.2311459481716156, -0.219686821103096, -0.20822767913341522, -0.19676855206489563, -0.18530941009521484, -0.17385028302669525, -0.16239115595817566, -0.15093201398849487, -0.13947288691997528, -0.1280137598514557, -0.1165546253323555, -0.10509549081325531, -0.09363636374473572, -0.08217722922563553, -0.07071809470653534, -0.05925896763801575, -0.04779983311891556, -0.036340706050395966, -0.024881571531295776, -0.013422439806163311, -0.0019633080810308456, 0.009495824575424194, 0.020954955369234085, 0.032414086163043976, 0.043873220682144165, 0.05533234775066376, 0.06679148226976395, 0.07825061678886414, 0.08970974385738373, 0.10116887837648392, 0.1126280128955841, 0.1240871399641037, 0.1355462670326233, 0.14700540900230408, 0.15846453607082367, 0.16992366313934326, 0.18138280510902405, 0.19284193217754364, 0.20430105924606323, 0.21576020121574402, 0.2272193282842636, 0.2386784553527832, 0.250137597322464, 0.2615967392921448, 0.2730558514595032, 0.28451499342918396, 0.29597413539886475, 0.30743324756622314, 0.31889238953590393, 0.3303515315055847, 0.3418106436729431]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 5.0, 8.0, 12.0, 12.0, 20.0, 30.0, 31.0, 48.0, 69.0, 101.0, 146.0, 230.0, 325.0, 495.0, 767.0, 1275.0, 2230.0, 4225.0, 9713.0, 26204.0, 96092.0, 552201.0, 270137.0, 52466.0, 16739.0, 6902.0, 3215.0, 1735.0, 1035.0, 707.0, 454.0, 276.0, 189.0, 151.0, 96.0, 64.0, 48.0, 32.0, 18.0, 17.0, 11.0, 2.0, 6.0, 9.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0882568359375, -0.08572006225585938, -0.08318328857421875, -0.08064651489257812, -0.0781097412109375, -0.07557296752929688, -0.07303619384765625, -0.07049942016601562, -0.067962646484375, -0.06542587280273438, -0.06288909912109375, -0.060352325439453125, -0.0578155517578125, -0.055278778076171875, -0.05274200439453125, -0.050205230712890625, -0.04766845703125, -0.045131683349609375, -0.04259490966796875, -0.040058135986328125, -0.0375213623046875, -0.034984588623046875, -0.03244781494140625, -0.029911041259765625, -0.027374267578125, -0.024837493896484375, -0.02230072021484375, -0.019763946533203125, -0.0172271728515625, -0.014690399169921875, -0.01215362548828125, -0.009616851806640625, -0.007080078125, -0.004543304443359375, -0.00200653076171875, 0.000530242919921875, 0.0030670166015625, 0.005603790283203125, 0.00814056396484375, 0.010677337646484375, 0.013214111328125, 0.015750885009765625, 0.01828765869140625, 0.020824432373046875, 0.0233612060546875, 0.025897979736328125, 0.02843475341796875, 0.030971527099609375, 0.03350830078125, 0.036045074462890625, 0.03858184814453125, 0.041118621826171875, 0.0436553955078125, 0.046192169189453125, 0.04872894287109375, 0.051265716552734375, 0.053802490234375, 0.056339263916015625, 0.05887603759765625, 0.061412811279296875, 0.0639495849609375, 0.06648635864257812, 0.06902313232421875, 0.07155990600585938, 0.0740966796875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 9.0, 9.0, 22.0, 32.0, 31.0, 48.0, 71.0, 104.0, 108.0, 118.0, 105.0, 87.0, 68.0, 55.0, 31.0, 20.0, 25.0, 19.0, 6.0, 4.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.158203125, -0.1536388397216797, -0.14907455444335938, -0.14451026916503906, -0.13994598388671875, -0.13538169860839844, -0.13081741333007812, -0.1262531280517578, -0.1216888427734375, -0.11712455749511719, -0.11256027221679688, -0.10799598693847656, -0.10343170166015625, -0.09886741638183594, -0.09430313110351562, -0.08973884582519531, -0.085174560546875, -0.08061027526855469, -0.07604598999023438, -0.07148170471191406, -0.06691741943359375, -0.06235313415527344, -0.057788848876953125, -0.05322456359863281, -0.0486602783203125, -0.04409599304199219, -0.039531707763671875, -0.03496742248535156, -0.03040313720703125, -0.025838851928710938, -0.021274566650390625, -0.016710281372070312, -0.01214599609375, -0.0075817108154296875, -0.003017425537109375, 0.0015468597412109375, 0.00611114501953125, 0.010675430297851562, 0.015239715576171875, 0.019804000854492188, 0.0243682861328125, 0.028932571411132812, 0.033496856689453125, 0.03806114196777344, 0.04262542724609375, 0.04718971252441406, 0.051753997802734375, 0.05631828308105469, 0.060882568359375, 0.06544685363769531, 0.07001113891601562, 0.07457542419433594, 0.07913970947265625, 0.08370399475097656, 0.08826828002929688, 0.09283256530761719, 0.0973968505859375, 0.10196113586425781, 0.10652542114257812, 0.11108970642089844, 0.11565399169921875, 0.12021827697753906, 0.12478256225585938, 0.1293468475341797, 0.1339111328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 7.0, 4.0, 6.0, 10.0, 14.0, 26.0, 32.0, 37.0, 59.0, 88.0, 120.0, 209.0, 261.0, 498.0, 821.0, 2167.0, 8013.0, 52798.0, 832126.0, 131387.0, 14233.0, 3049.0, 1096.0, 531.0, 308.0, 196.0, 117.0, 91.0, 78.0, 53.0, 34.0, 20.0, 23.0, 9.0, 11.0, 6.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11370849609375, -0.10869312286376953, -0.10367774963378906, -0.0986623764038086, -0.09364700317382812, -0.08863162994384766, -0.08361625671386719, -0.07860088348388672, -0.07358551025390625, -0.06857013702392578, -0.06355476379394531, -0.058539390563964844, -0.053524017333984375, -0.048508644104003906, -0.04349327087402344, -0.03847789764404297, -0.0334625244140625, -0.02844715118408203, -0.023431777954101562, -0.018416404724121094, -0.013401031494140625, -0.008385658264160156, -0.0033702850341796875, 0.0016450881958007812, 0.00666046142578125, 0.011675834655761719, 0.016691207885742188, 0.021706581115722656, 0.026721954345703125, 0.031737327575683594, 0.03675270080566406, 0.04176807403564453, 0.046783447265625, 0.05179882049560547, 0.05681419372558594, 0.061829566955566406, 0.06684494018554688, 0.07186031341552734, 0.07687568664550781, 0.08189105987548828, 0.08690643310546875, 0.09192180633544922, 0.09693717956542969, 0.10195255279541016, 0.10696792602539062, 0.1119832992553711, 0.11699867248535156, 0.12201404571533203, 0.1270294189453125, 0.13204479217529297, 0.13706016540527344, 0.1420755386352539, 0.14709091186523438, 0.15210628509521484, 0.1571216583251953, 0.16213703155517578, 0.16715240478515625, 0.17216777801513672, 0.1771831512451172, 0.18219852447509766, 0.18721389770507812, 0.1922292709350586, 0.19724464416503906, 0.20226001739501953, 0.207275390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 5.0, 9.0, 9.0, 10.0, 15.0, 18.0, 23.0, 23.0, 34.0, 35.0, 50.0, 56.0, 63.0, 69.0, 56.0, 70.0, 53.0, 51.0, 62.0, 62.0, 53.0, 35.0, 26.0, 21.0, 20.0, 16.0, 13.0, 10.0, 9.0, 8.0, 4.0, 5.0, 4.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.274169921875, -0.2625236511230469, -0.25087738037109375, -0.23923110961914062, -0.2275848388671875, -0.21593856811523438, -0.20429229736328125, -0.19264602661132812, -0.180999755859375, -0.16935348510742188, -0.15770721435546875, -0.14606094360351562, -0.1344146728515625, -0.12276840209960938, -0.11112213134765625, -0.09947586059570312, -0.08782958984375, -0.07618331909179688, -0.06453704833984375, -0.052890777587890625, -0.0412445068359375, -0.029598236083984375, -0.01795196533203125, -0.006305694580078125, 0.005340576171875, 0.016986846923828125, 0.02863311767578125, 0.040279388427734375, 0.0519256591796875, 0.06357192993164062, 0.07521820068359375, 0.08686447143554688, 0.0985107421875, 0.11015701293945312, 0.12180328369140625, 0.13344955444335938, 0.1450958251953125, 0.15674209594726562, 0.16838836669921875, 0.18003463745117188, 0.191680908203125, 0.20332717895507812, 0.21497344970703125, 0.22661972045898438, 0.2382659912109375, 0.24991226196289062, 0.26155853271484375, 0.2732048034667969, 0.28485107421875, 0.2964973449707031, 0.30814361572265625, 0.3197898864746094, 0.3314361572265625, 0.3430824279785156, 0.35472869873046875, 0.3663749694824219, 0.378021240234375, 0.3896675109863281, 0.40131378173828125, 0.4129600524902344, 0.4246063232421875, 0.4362525939941406, 0.44789886474609375, 0.4595451354980469, 0.47119140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 5.0, 5.0, 2.0, 2.0, 6.0, 10.0, 10.0, 13.0, 32.0, 35.0, 60.0, 138.0, 255.0, 624.0, 1519.0, 4603.0, 21058.0, 246842.0, 728153.0, 35367.0, 6452.0, 1912.0, 742.0, 325.0, 168.0, 73.0, 52.0, 26.0, 16.0, 21.0, 14.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0164337158203125, -0.015779733657836914, -0.015125751495361328, -0.014471769332885742, -0.013817787170410156, -0.01316380500793457, -0.012509822845458984, -0.011855840682983398, -0.011201858520507812, -0.010547876358032227, -0.00989389419555664, -0.009239912033081055, -0.008585929870605469, -0.007931947708129883, -0.007277965545654297, -0.006623983383178711, -0.005970001220703125, -0.005316019058227539, -0.004662036895751953, -0.004008054733276367, -0.0033540725708007812, -0.0027000904083251953, -0.0020461082458496094, -0.0013921260833740234, -0.0007381439208984375, -8.416175842285156e-05, 0.0005698204040527344, 0.0012238025665283203, 0.0018777847290039062, 0.002531766891479492, 0.003185749053955078, 0.003839731216430664, 0.00449371337890625, 0.005147695541381836, 0.005801677703857422, 0.006455659866333008, 0.007109642028808594, 0.00776362419128418, 0.008417606353759766, 0.009071588516235352, 0.009725570678710938, 0.010379552841186523, 0.01103353500366211, 0.011687517166137695, 0.012341499328613281, 0.012995481491088867, 0.013649463653564453, 0.014303445816040039, 0.014957427978515625, 0.015611410140991211, 0.016265392303466797, 0.016919374465942383, 0.01757335662841797, 0.018227338790893555, 0.01888132095336914, 0.019535303115844727, 0.020189285278320312, 0.0208432674407959, 0.021497249603271484, 0.02215123176574707, 0.022805213928222656, 0.023459196090698242, 0.024113178253173828, 0.024767160415649414, 0.025421142578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 13.0, 6.0, 4.0, 15.0, 9.0, 24.0, 19.0, 25.0, 22.0, 46.0, 33.0, 66.0, 35.0, 78.0, 46.0, 68.0, 37.0, 79.0, 64.0, 34.0, 66.0, 34.0, 33.0, 22.0, 26.0, 15.0, 16.0, 9.0, 10.0, 6.0, 8.0, 2.0, 8.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.589557647705078e-06, -4.438683390617371e-06, -4.287809133529663e-06, -4.1369348764419556e-06, -3.986060619354248e-06, -3.8351863622665405e-06, -3.684312105178833e-06, -3.5334378480911255e-06, -3.382563591003418e-06, -3.2316893339157104e-06, -3.080815076828003e-06, -2.9299408197402954e-06, -2.779066562652588e-06, -2.6281923055648804e-06, -2.477318048477173e-06, -2.3264437913894653e-06, -2.175569534301758e-06, -2.0246952772140503e-06, -1.8738210201263428e-06, -1.7229467630386353e-06, -1.5720725059509277e-06, -1.4211982488632202e-06, -1.2703239917755127e-06, -1.1194497346878052e-06, -9.685754776000977e-07, -8.177012205123901e-07, -6.668269634246826e-07, -5.159527063369751e-07, -3.650784492492676e-07, -2.1420419216156006e-07, -6.332993507385254e-08, 8.754432201385498e-08, 2.384185791015625e-07, 3.8929283618927e-07, 5.401670932769775e-07, 6.910413503646851e-07, 8.419156074523926e-07, 9.927898645401e-07, 1.1436641216278076e-06, 1.2945383787155151e-06, 1.4454126358032227e-06, 1.5962868928909302e-06, 1.7471611499786377e-06, 1.8980354070663452e-06, 2.0489096641540527e-06, 2.1997839212417603e-06, 2.3506581783294678e-06, 2.5015324354171753e-06, 2.652406692504883e-06, 2.8032809495925903e-06, 2.954155206680298e-06, 3.1050294637680054e-06, 3.255903720855713e-06, 3.4067779779434204e-06, 3.557652235031128e-06, 3.7085264921188354e-06, 3.859400749206543e-06, 4.0102750062942505e-06, 4.161149263381958e-06, 4.3120235204696655e-06, 4.462897777557373e-06, 4.6137720346450806e-06, 4.764646291732788e-06, 4.915520548820496e-06, 5.066394805908203e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 15.0, 20.0, 25.0, 27.0, 41.0, 95.0, 143.0, 255.0, 462.0, 902.0, 2132.0, 7746.0, 57911.0, 835488.0, 125259.0, 12557.0, 3073.0, 1147.0, 552.0, 273.0, 124.0, 96.0, 60.0, 47.0, 20.0, 14.0, 12.0, 9.0, 3.0, 5.0, 3.0, 3.0, 2.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0182342529296875, -0.017657995223999023, -0.017081737518310547, -0.01650547981262207, -0.015929222106933594, -0.015352964401245117, -0.01477670669555664, -0.014200448989868164, -0.013624191284179688, -0.013047933578491211, -0.012471675872802734, -0.011895418167114258, -0.011319160461425781, -0.010742902755737305, -0.010166645050048828, -0.009590387344360352, -0.009014129638671875, -0.008437871932983398, -0.007861614227294922, -0.007285356521606445, -0.006709098815917969, -0.006132841110229492, -0.005556583404541016, -0.004980325698852539, -0.0044040679931640625, -0.003827810287475586, -0.0032515525817871094, -0.002675294876098633, -0.0020990371704101562, -0.0015227794647216797, -0.0009465217590332031, -0.00037026405334472656, 0.00020599365234375, 0.0007822513580322266, 0.0013585090637207031, 0.0019347667694091797, 0.0025110244750976562, 0.003087282180786133, 0.0036635398864746094, 0.004239797592163086, 0.0048160552978515625, 0.005392313003540039, 0.005968570709228516, 0.006544828414916992, 0.007121086120605469, 0.007697343826293945, 0.008273601531982422, 0.008849859237670898, 0.009426116943359375, 0.010002374649047852, 0.010578632354736328, 0.011154890060424805, 0.011731147766113281, 0.012307405471801758, 0.012883663177490234, 0.013459920883178711, 0.014036178588867188, 0.014612436294555664, 0.01518869400024414, 0.015764951705932617, 0.016341209411621094, 0.01691746711730957, 0.017493724822998047, 0.018069982528686523, 0.018646240234375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 10.0, 7.0, 20.0, 27.0, 37.0, 63.0, 86.0, 129.0, 152.0, 143.0, 120.0, 70.0, 50.0, 30.0, 21.0, 10.0, 4.0, 6.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045562744140625, -0.044126033782958984, -0.04268932342529297, -0.04125261306762695, -0.03981590270996094, -0.03837919235229492, -0.036942481994628906, -0.03550577163696289, -0.034069061279296875, -0.03263235092163086, -0.031195640563964844, -0.029758930206298828, -0.028322219848632812, -0.026885509490966797, -0.02544879913330078, -0.024012088775634766, -0.02257537841796875, -0.021138668060302734, -0.01970195770263672, -0.018265247344970703, -0.016828536987304688, -0.015391826629638672, -0.013955116271972656, -0.01251840591430664, -0.011081695556640625, -0.00964498519897461, -0.008208274841308594, -0.006771564483642578, -0.0053348541259765625, -0.003898143768310547, -0.0024614334106445312, -0.0010247230529785156, 0.0004119873046875, 0.0018486976623535156, 0.0032854080200195312, 0.004722118377685547, 0.0061588287353515625, 0.007595539093017578, 0.009032249450683594, 0.01046895980834961, 0.011905670166015625, 0.01334238052368164, 0.014779090881347656, 0.016215801239013672, 0.017652511596679688, 0.019089221954345703, 0.02052593231201172, 0.021962642669677734, 0.02339935302734375, 0.024836063385009766, 0.02627277374267578, 0.027709484100341797, 0.029146194458007812, 0.030582904815673828, 0.032019615173339844, 0.03345632553100586, 0.034893035888671875, 0.03632974624633789, 0.037766456604003906, 0.03920316696166992, 0.04063987731933594, 0.04207658767700195, 0.04351329803466797, 0.044950008392333984, 0.04638671875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 3.0, 15.0, 26.0, 118.0, 355.0, 270.0, 110.0, 44.0, 19.0, 14.0, 10.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5716817378997803, -0.5376864075660706, -0.5036910176277161, -0.46969568729400635, -0.43570032715797424, -0.40170496702194214, -0.3677096366882324, -0.3337142765522003, -0.2997189164161682, -0.2657235562801361, -0.2317282110452652, -0.1977328658103943, -0.16373750567436218, -0.12974214553833008, -0.09574680030345917, -0.06175145506858826, -0.027756094932556152, 0.006239257752895355, 0.04023461043834686, 0.07422996312379837, 0.10822531580924988, 0.14222067594528198, 0.1762160211801529, 0.2102113664150238, 0.2442067265510559, 0.278202086687088, 0.3121974468231201, 0.34619277715682983, 0.38018813729286194, 0.41418349742889404, 0.44817882776260376, 0.48217418789863586, 0.5161694288253784, 0.5501647591590881, 0.5841601490974426, 0.6181554794311523, 0.6521508693695068, 0.6861461997032166, 0.7201415300369263, 0.7541369199752808, 0.7881322503089905, 0.8221275806427002, 0.8561229705810547, 0.8901183009147644, 0.9241136312484741, 0.9581090211868286, 0.9921043515205383, 1.026099681854248, 1.0600950717926025, 1.094090461730957, 1.128085732460022, 1.1620811223983765, 1.196076512336731, 1.230071783065796, 1.2640671730041504, 1.2980625629425049, 1.3320579528808594, 1.3660533428192139, 1.4000486135482788, 1.4340440034866333, 1.4680393934249878, 1.5020346641540527, 1.5360300540924072, 1.5700254440307617, 1.6040207147598267]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 8.0, 6.0, 4.0, 13.0, 13.0, 8.0, 17.0, 13.0, 14.0, 18.0, 17.0, 26.0, 27.0, 34.0, 38.0, 40.0, 65.0, 82.0, 85.0, 82.0, 52.0, 41.0, 42.0, 29.0, 30.0, 27.0, 28.0, 22.0, 17.0, 14.0, 19.0, 13.0, 6.0, 12.0, 6.0, 5.0, 6.0, 1.0, 2.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9107792377471924, -0.8788121938705444, -0.8468451499938965, -0.8148781061172485, -0.7829110622406006, -0.7509440183639526, -0.7189769148826599, -0.687009871006012, -0.655042827129364, -0.6230757832527161, -0.5911087393760681, -0.5591416954994202, -0.5271745920181274, -0.4952075779438019, -0.46324050426483154, -0.4312734603881836, -0.39930641651153564, -0.3673393726348877, -0.33537232875823975, -0.3034052550792694, -0.27143821120262146, -0.2394711673259735, -0.20750410854816437, -0.17553704977035522, -0.14357000589370728, -0.11160295456647873, -0.07963590323925018, -0.04766885191202164, -0.01570180058479309, 0.01626524329185486, 0.048232302069664, 0.08019936084747314, 0.1121664047241211, 0.14413344860076904, 0.17610050737857819, 0.20806756615638733, 0.24003461003303528, 0.2720016539096832, 0.30396872758865356, 0.3359357714653015, 0.36790281534194946, 0.3998698592185974, 0.43183690309524536, 0.4638039767742157, 0.49577102065086365, 0.527738094329834, 0.5597051382064819, 0.5916721820831299, 0.6236392259597778, 0.6556062698364258, 0.6875733137130737, 0.7195403575897217, 0.7515074014663696, 0.7834744453430176, 0.8154415488243103, 0.8474085927009583, 0.8793756365776062, 0.9113426804542542, 0.9433097243309021, 0.97527676820755, 1.0072438716888428, 1.0392109155654907, 1.0711779594421387, 1.1031450033187866, 1.1351120471954346]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 6.0, 6.0, 14.0, 32.0, 49.0, 96.0, 160.0, 293.0, 559.0, 843.0, 1287.0, 2065.0, 3379.0, 5469.0, 9166.0, 15015.0, 28358.0, 63701.0, 160445.0, 474572.0, 1818516.0, 1128019.0, 306556.0, 100408.0, 38294.0, 15720.0, 7264.0, 4216.0, 2746.0, 1977.0, 1483.0, 1098.0, 756.0, 592.0, 377.0, 253.0, 193.0, 120.0, 84.0, 49.0, 23.0, 17.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.031982421875, -0.031062841415405273, -0.030143260955810547, -0.02922368049621582, -0.028304100036621094, -0.027384519577026367, -0.02646493911743164, -0.025545358657836914, -0.024625778198242188, -0.02370619773864746, -0.022786617279052734, -0.021867036819458008, -0.02094745635986328, -0.020027875900268555, -0.019108295440673828, -0.0181887149810791, -0.017269134521484375, -0.01634955406188965, -0.015429973602294922, -0.014510393142700195, -0.013590812683105469, -0.012671232223510742, -0.011751651763916016, -0.010832071304321289, -0.009912490844726562, -0.008992910385131836, -0.00807332992553711, -0.007153749465942383, -0.006234169006347656, -0.00531458854675293, -0.004395008087158203, -0.0034754276275634766, -0.00255584716796875, -0.0016362667083740234, -0.0007166862487792969, 0.0002028942108154297, 0.0011224746704101562, 0.002042055130004883, 0.0029616355895996094, 0.003881216049194336, 0.0048007965087890625, 0.005720376968383789, 0.006639957427978516, 0.007559537887573242, 0.008479118347167969, 0.009398698806762695, 0.010318279266357422, 0.011237859725952148, 0.012157440185546875, 0.013077020645141602, 0.013996601104736328, 0.014916181564331055, 0.01583576202392578, 0.016755342483520508, 0.017674922943115234, 0.01859450340270996, 0.019514083862304688, 0.020433664321899414, 0.02135324478149414, 0.022272825241088867, 0.023192405700683594, 0.02411198616027832, 0.025031566619873047, 0.025951147079467773, 0.0268707275390625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 16.0, 18.0, 21.0, 34.0, 43.0, 62.0, 71.0, 102.0, 93.0, 118.0, 108.0, 67.0, 54.0, 47.0, 38.0, 35.0, 11.0, 20.0, 8.0, 3.0, 6.0, 2.0, 8.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1552734375, -0.1507568359375, -0.146240234375, -0.1417236328125, -0.13720703125, -0.1326904296875, -0.128173828125, -0.1236572265625, -0.119140625, -0.1146240234375, -0.110107421875, -0.1055908203125, -0.10107421875, -0.0965576171875, -0.092041015625, -0.0875244140625, -0.0830078125, -0.0784912109375, -0.073974609375, -0.0694580078125, -0.06494140625, -0.0604248046875, -0.055908203125, -0.0513916015625, -0.046875, -0.0423583984375, -0.037841796875, -0.0333251953125, -0.02880859375, -0.0242919921875, -0.019775390625, -0.0152587890625, -0.0107421875, -0.0062255859375, -0.001708984375, 0.0028076171875, 0.00732421875, 0.0118408203125, 0.016357421875, 0.0208740234375, 0.025390625, 0.0299072265625, 0.034423828125, 0.0389404296875, 0.04345703125, 0.0479736328125, 0.052490234375, 0.0570068359375, 0.0615234375, 0.0660400390625, 0.070556640625, 0.0750732421875, 0.07958984375, 0.0841064453125, 0.088623046875, 0.0931396484375, 0.09765625, 0.1021728515625, 0.106689453125, 0.1112060546875, 0.11572265625, 0.1202392578125, 0.124755859375, 0.1292724609375, 0.1337890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 13.0, 34.0, 80.0, 199.0, 435.0, 1628.0, 40031.0, 4145683.0, 4969.0, 731.0, 281.0, 116.0, 44.0, 16.0, 10.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26318359375, -0.2544898986816406, -0.24579620361328125, -0.23710250854492188, -0.2284088134765625, -0.21971511840820312, -0.21102142333984375, -0.20232772827148438, -0.193634033203125, -0.18494033813476562, -0.17624664306640625, -0.16755294799804688, -0.1588592529296875, -0.15016555786132812, -0.14147186279296875, -0.13277816772460938, -0.12408447265625, -0.11539077758789062, -0.10669708251953125, -0.09800338745117188, -0.0893096923828125, -0.08061599731445312, -0.07192230224609375, -0.06322860717773438, -0.054534912109375, -0.045841217041015625, -0.03714752197265625, -0.028453826904296875, -0.0197601318359375, -0.011066436767578125, -0.00237274169921875, 0.006320953369140625, 0.0150146484375, 0.023708343505859375, 0.03240203857421875, 0.041095733642578125, 0.0497894287109375, 0.058483123779296875, 0.06717681884765625, 0.07587051391601562, 0.084564208984375, 0.09325790405273438, 0.10195159912109375, 0.11064529418945312, 0.1193389892578125, 0.12803268432617188, 0.13672637939453125, 0.14542007446289062, 0.15411376953125, 0.16280746459960938, 0.17150115966796875, 0.18019485473632812, 0.1888885498046875, 0.19758224487304688, 0.20627593994140625, 0.21496963500976562, 0.223663330078125, 0.23235702514648438, 0.24105072021484375, 0.24974441528320312, 0.2584381103515625, 0.2671318054199219, 0.27582550048828125, 0.2845191955566406, 0.293212890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 12.0, 18.0, 36.0, 159.0, 566.0, 1677.0, 1132.0, 345.0, 74.0, 29.0, 12.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1968994140625, -0.1910552978515625, -0.185211181640625, -0.1793670654296875, -0.17352294921875, -0.1676788330078125, -0.161834716796875, -0.1559906005859375, -0.150146484375, -0.1443023681640625, -0.138458251953125, -0.1326141357421875, -0.12677001953125, -0.1209259033203125, -0.115081787109375, -0.1092376708984375, -0.1033935546875, -0.0975494384765625, -0.091705322265625, -0.0858612060546875, -0.08001708984375, -0.0741729736328125, -0.068328857421875, -0.0624847412109375, -0.056640625, -0.0507965087890625, -0.044952392578125, -0.0391082763671875, -0.03326416015625, -0.0274200439453125, -0.021575927734375, -0.0157318115234375, -0.0098876953125, -0.0040435791015625, 0.001800537109375, 0.0076446533203125, 0.01348876953125, 0.0193328857421875, 0.025177001953125, 0.0310211181640625, 0.036865234375, 0.0427093505859375, 0.048553466796875, 0.0543975830078125, 0.06024169921875, 0.0660858154296875, 0.071929931640625, 0.0777740478515625, 0.0836181640625, 0.0894622802734375, 0.095306396484375, 0.1011505126953125, 0.10699462890625, 0.1128387451171875, 0.118682861328125, 0.1245269775390625, 0.13037109375, 0.1362152099609375, 0.142059326171875, 0.1479034423828125, 0.15374755859375, 0.1595916748046875, 0.165435791015625, 0.1712799072265625, 0.1771240234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 3.0, 8.0, 8.0, 14.0, 9.0, 20.0, 45.0, 112.0, 261.0, 329.0, 124.0, 35.0, 21.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0349597930908203, -1.0111228227615356, -0.9872857928276062, -0.9634488224983215, -0.9396118521690369, -0.9157748222351074, -0.8919378519058228, -0.8681008815765381, -0.8442639112472534, -0.8204269409179688, -0.7965899109840393, -0.7727529406547546, -0.74891597032547, -0.7250789403915405, -0.7012419700622559, -0.6774049997329712, -0.6535679697990417, -0.6297309994697571, -0.6058939695358276, -0.582056999206543, -0.5582200288772583, -0.5343830585479736, -0.5105460286140442, -0.4867090582847595, -0.46287205815315247, -0.4390350580215454, -0.41519808769226074, -0.3913610875606537, -0.36752408742904663, -0.34368711709976196, -0.3198501169681549, -0.29601311683654785, -0.2721761167049408, -0.24833913147449493, -0.22450214624404907, -0.20066514611244202, -0.17682816088199615, -0.1529911756515503, -0.12915417551994324, -0.10531719028949738, -0.08148020505905151, -0.05764321610331535, -0.03380622714757919, -0.009969234466552734, 0.013867750763893127, 0.03770473599433899, 0.061541736125946045, 0.0853787213563919, 0.10921570658683777, 0.13305269181728363, 0.1568896770477295, 0.18072667717933655, 0.2045636624097824, 0.22840064764022827, 0.2522376477718353, 0.2760746479034424, 0.29991161823272705, 0.3237486183643341, 0.3475855886936188, 0.37142258882522583, 0.3952595591545105, 0.41909655928611755, 0.4429335594177246, 0.4667705297470093, 0.49060752987861633]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 11.0, 10.0, 15.0, 11.0, 13.0, 19.0, 22.0, 20.0, 25.0, 36.0, 29.0, 37.0, 37.0, 40.0, 49.0, 38.0, 38.0, 48.0, 52.0, 32.0, 44.0, 42.0, 29.0, 34.0, 41.0, 31.0, 25.0, 25.0, 23.0, 19.0, 20.0, 17.0, 15.0, 11.0, 6.0, 9.0, 3.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.36208075284957886, -0.3493303954601288, -0.3365800082683563, -0.32382965087890625, -0.3110792636871338, -0.2983289062976837, -0.28557854890823364, -0.2728281617164612, -0.2600778043270111, -0.24732743203639984, -0.23457705974578857, -0.2218267023563385, -0.20907633006572723, -0.19632595777511597, -0.1835755854845047, -0.17082521319389343, -0.15807484090328217, -0.1453244686126709, -0.13257409632205963, -0.11982373148202896, -0.10707336664199829, -0.09432299435138702, -0.08157262206077576, -0.06882225722074509, -0.05607188493013382, -0.04332151636481285, -0.030571145936846733, -0.017820775508880615, -0.005070406943559647, 0.007679961621761322, 0.02043033391237259, 0.03318069875240326, 0.045931071043014526, 0.058681439608335495, 0.07143180817365646, 0.08418218046426773, 0.0969325453042984, 0.10968291759490967, 0.12243328988552094, 0.1351836621761322, 0.14793401956558228, 0.16068439185619354, 0.1734347641468048, 0.18618512153625488, 0.19893549382686615, 0.21168586611747742, 0.22443623840808868, 0.23718661069869995, 0.24993698298931122, 0.2626873552799225, 0.27543771266937256, 0.288188099861145, 0.3009384572505951, 0.31368881464004517, 0.3264392018318176, 0.3391895592212677, 0.35193994641304016, 0.36469030380249023, 0.3774406909942627, 0.39019104838371277, 0.40294143557548523, 0.4156917929649353, 0.42844218015670776, 0.44119253754615784, 0.4539428949356079]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 8.0, 8.0, 10.0, 9.0, 13.0, 19.0, 25.0, 27.0, 47.0, 59.0, 71.0, 114.0, 129.0, 215.0, 346.0, 538.0, 844.0, 1489.0, 2598.0, 5257.0, 12538.0, 37718.0, 174195.0, 615256.0, 141874.0, 32529.0, 11351.0, 4933.0, 2518.0, 1363.0, 804.0, 490.0, 319.0, 240.0, 148.0, 112.0, 84.0, 62.0, 47.0, 22.0, 20.0, 29.0, 10.0, 15.0, 16.0, 6.0, 7.0, 2.0, 3.0, 6.0, 5.0, 2.0, 3.0], "bins": [-0.0980224609375, -0.09517669677734375, -0.0923309326171875, -0.08948516845703125, -0.086639404296875, -0.08379364013671875, -0.0809478759765625, -0.07810211181640625, -0.07525634765625, -0.07241058349609375, -0.0695648193359375, -0.06671905517578125, -0.063873291015625, -0.06102752685546875, -0.0581817626953125, -0.05533599853515625, -0.052490234375, -0.04964447021484375, -0.0467987060546875, -0.04395294189453125, -0.041107177734375, -0.03826141357421875, -0.0354156494140625, -0.03256988525390625, -0.02972412109375, -0.02687835693359375, -0.0240325927734375, -0.02118682861328125, -0.018341064453125, -0.01549530029296875, -0.0126495361328125, -0.00980377197265625, -0.0069580078125, -0.00411224365234375, -0.0012664794921875, 0.00157928466796875, 0.004425048828125, 0.00727081298828125, 0.0101165771484375, 0.01296234130859375, 0.01580810546875, 0.01865386962890625, 0.0214996337890625, 0.02434539794921875, 0.027191162109375, 0.03003692626953125, 0.0328826904296875, 0.03572845458984375, 0.03857421875, 0.04141998291015625, 0.0442657470703125, 0.04711151123046875, 0.049957275390625, 0.05280303955078125, 0.0556488037109375, 0.05849456787109375, 0.06134033203125, 0.06418609619140625, 0.0670318603515625, 0.06987762451171875, 0.072723388671875, 0.07556915283203125, 0.0784149169921875, 0.08126068115234375, 0.0841064453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 11.0, 19.0, 17.0, 33.0, 46.0, 72.0, 68.0, 92.0, 104.0, 112.0, 115.0, 60.0, 54.0, 52.0, 41.0, 35.0, 16.0, 13.0, 8.0, 3.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1556396484375, -0.15111541748046875, -0.1465911865234375, -0.14206695556640625, -0.137542724609375, -0.13301849365234375, -0.1284942626953125, -0.12397003173828125, -0.11944580078125, -0.11492156982421875, -0.1103973388671875, -0.10587310791015625, -0.101348876953125, -0.09682464599609375, -0.0923004150390625, -0.08777618408203125, -0.083251953125, -0.07872772216796875, -0.0742034912109375, -0.06967926025390625, -0.065155029296875, -0.06063079833984375, -0.0561065673828125, -0.05158233642578125, -0.04705810546875, -0.04253387451171875, -0.0380096435546875, -0.03348541259765625, -0.028961181640625, -0.02443695068359375, -0.0199127197265625, -0.01538848876953125, -0.0108642578125, -0.00634002685546875, -0.0018157958984375, 0.00270843505859375, 0.007232666015625, 0.01175689697265625, 0.0162811279296875, 0.02080535888671875, 0.02532958984375, 0.02985382080078125, 0.0343780517578125, 0.03890228271484375, 0.043426513671875, 0.04795074462890625, 0.0524749755859375, 0.05699920654296875, 0.0615234375, 0.06604766845703125, 0.0705718994140625, 0.07509613037109375, 0.079620361328125, 0.08414459228515625, 0.0886688232421875, 0.09319305419921875, 0.09771728515625, 0.10224151611328125, 0.1067657470703125, 0.11128997802734375, 0.115814208984375, 0.12033843994140625, 0.1248626708984375, 0.12938690185546875, 0.1339111328125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 6.0, 5.0, 4.0, 6.0, 14.0, 13.0, 16.0, 26.0, 28.0, 38.0, 60.0, 67.0, 122.0, 160.0, 286.0, 373.0, 648.0, 1153.0, 2722.0, 9441.0, 62414.0, 848911.0, 102743.0, 12728.0, 3244.0, 1284.0, 664.0, 390.0, 266.0, 168.0, 143.0, 109.0, 82.0, 56.0, 44.0, 33.0, 18.0, 27.0, 7.0, 9.0, 8.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.156982421875, -0.15216636657714844, -0.14735031127929688, -0.1425342559814453, -0.13771820068359375, -0.1329021453857422, -0.12808609008789062, -0.12327003479003906, -0.1184539794921875, -0.11363792419433594, -0.10882186889648438, -0.10400581359863281, -0.09918975830078125, -0.09437370300292969, -0.08955764770507812, -0.08474159240722656, -0.079925537109375, -0.07510948181152344, -0.07029342651367188, -0.06547737121582031, -0.06066131591796875, -0.05584526062011719, -0.051029205322265625, -0.04621315002441406, -0.0413970947265625, -0.03658103942871094, -0.031764984130859375, -0.026948928833007812, -0.02213287353515625, -0.017316818237304688, -0.012500762939453125, -0.0076847076416015625, -0.00286865234375, 0.0019474029541015625, 0.006763458251953125, 0.011579513549804688, 0.01639556884765625, 0.021211624145507812, 0.026027679443359375, 0.030843734741210938, 0.0356597900390625, 0.04047584533691406, 0.045291900634765625, 0.05010795593261719, 0.05492401123046875, 0.05974006652832031, 0.06455612182617188, 0.06937217712402344, 0.074188232421875, 0.07900428771972656, 0.08382034301757812, 0.08863639831542969, 0.09345245361328125, 0.09826850891113281, 0.10308456420898438, 0.10790061950683594, 0.1127166748046875, 0.11753273010253906, 0.12234878540039062, 0.1271648406982422, 0.13198089599609375, 0.1367969512939453, 0.14161300659179688, 0.14642906188964844, 0.1512451171875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 10.0, 4.0, 10.0, 6.0, 14.0, 18.0, 21.0, 20.0, 22.0, 23.0, 37.0, 42.0, 40.0, 55.0, 57.0, 67.0, 70.0, 53.0, 64.0, 57.0, 49.0, 36.0, 40.0, 26.0, 17.0, 16.0, 17.0, 10.0, 19.0, 16.0, 12.0, 10.0, 10.0, 10.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.330810546875, -0.3205833435058594, -0.31035614013671875, -0.3001289367675781, -0.2899017333984375, -0.2796745300292969, -0.26944732666015625, -0.2592201232910156, -0.248992919921875, -0.23876571655273438, -0.22853851318359375, -0.21831130981445312, -0.2080841064453125, -0.19785690307617188, -0.18762969970703125, -0.17740249633789062, -0.16717529296875, -0.15694808959960938, -0.14672088623046875, -0.13649368286132812, -0.1262664794921875, -0.11603927612304688, -0.10581207275390625, -0.09558486938476562, -0.085357666015625, -0.07513046264648438, -0.06490325927734375, -0.054676055908203125, -0.0444488525390625, -0.034221649169921875, -0.02399444580078125, -0.013767242431640625, -0.0035400390625, 0.006687164306640625, 0.01691436767578125, 0.027141571044921875, 0.0373687744140625, 0.047595977783203125, 0.05782318115234375, 0.06805038452148438, 0.078277587890625, 0.08850479125976562, 0.09873199462890625, 0.10895919799804688, 0.1191864013671875, 0.12941360473632812, 0.13964080810546875, 0.14986801147460938, 0.16009521484375, 0.17032241821289062, 0.18054962158203125, 0.19077682495117188, 0.2010040283203125, 0.21123123168945312, 0.22145843505859375, 0.23168563842773438, 0.241912841796875, 0.2521400451660156, 0.26236724853515625, 0.2725944519042969, 0.2828216552734375, 0.2930488586425781, 0.30327606201171875, 0.3135032653808594, 0.32373046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 6.0, 9.0, 11.0, 9.0, 16.0, 18.0, 22.0, 34.0, 51.0, 72.0, 105.0, 177.0, 245.0, 372.0, 626.0, 1142.0, 2265.0, 5737.0, 21872.0, 188674.0, 768034.0, 43403.0, 8896.0, 3087.0, 1469.0, 767.0, 482.0, 321.0, 199.0, 118.0, 82.0, 66.0, 41.0, 23.0, 28.0, 14.0, 14.0, 10.0, 7.0, 7.0, 5.0, 5.0, 4.0, 2.0, 1.0, 6.0, 1.0, 1.0], "bins": [-0.0260162353515625, -0.02529740333557129, -0.024578571319580078, -0.023859739303588867, -0.023140907287597656, -0.022422075271606445, -0.021703243255615234, -0.020984411239624023, -0.020265579223632812, -0.0195467472076416, -0.01882791519165039, -0.01810908317565918, -0.01739025115966797, -0.016671419143676758, -0.015952587127685547, -0.015233755111694336, -0.014514923095703125, -0.013796091079711914, -0.013077259063720703, -0.012358427047729492, -0.011639595031738281, -0.01092076301574707, -0.01020193099975586, -0.009483098983764648, -0.008764266967773438, -0.008045434951782227, -0.007326602935791016, -0.006607770919799805, -0.005888938903808594, -0.005170106887817383, -0.004451274871826172, -0.003732442855834961, -0.00301361083984375, -0.002294778823852539, -0.0015759468078613281, -0.0008571147918701172, -0.00013828277587890625, 0.0005805492401123047, 0.0012993812561035156, 0.0020182132720947266, 0.0027370452880859375, 0.0034558773040771484, 0.004174709320068359, 0.00489354133605957, 0.005612373352050781, 0.006331205368041992, 0.007050037384033203, 0.007768869400024414, 0.008487701416015625, 0.009206533432006836, 0.009925365447998047, 0.010644197463989258, 0.011363029479980469, 0.01208186149597168, 0.01280069351196289, 0.013519525527954102, 0.014238357543945312, 0.014957189559936523, 0.015676021575927734, 0.016394853591918945, 0.017113685607910156, 0.017832517623901367, 0.018551349639892578, 0.01927018165588379, 0.019989013671875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 12.0, 36.0, 44.0, 91.0, 117.0, 171.0, 174.0, 148.0, 80.0, 54.0, 29.0, 17.0, 10.0, 4.0, 1.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5914440155029297e-05, -1.5432946383953094e-05, -1.4951452612876892e-05, -1.446995884180069e-05, -1.3988465070724487e-05, -1.3506971299648285e-05, -1.3025477528572083e-05, -1.254398375749588e-05, -1.2062489986419678e-05, -1.1580996215343475e-05, -1.1099502444267273e-05, -1.061800867319107e-05, -1.0136514902114868e-05, -9.655021131038666e-06, -9.173527359962463e-06, -8.692033588886261e-06, -8.210539817810059e-06, -7.729046046733856e-06, -7.247552275657654e-06, -6.766058504581451e-06, -6.284564733505249e-06, -5.803070962429047e-06, -5.321577191352844e-06, -4.840083420276642e-06, -4.3585896492004395e-06, -3.877095878124237e-06, -3.3956021070480347e-06, -2.9141083359718323e-06, -2.43261456489563e-06, -1.9511207938194275e-06, -1.469627022743225e-06, -9.881332516670227e-07, -5.066394805908203e-07, -2.514570951461792e-08, 4.5634806156158447e-07, 9.378418326377869e-07, 1.4193356037139893e-06, 1.9008293747901917e-06, 2.382323145866394e-06, 2.8638169169425964e-06, 3.345310688018799e-06, 3.826804459095001e-06, 4.308298230171204e-06, 4.789792001247406e-06, 5.271285772323608e-06, 5.752779543399811e-06, 6.234273314476013e-06, 6.7157670855522156e-06, 7.197260856628418e-06, 7.67875462770462e-06, 8.160248398780823e-06, 8.641742169857025e-06, 9.123235940933228e-06, 9.60472971200943e-06, 1.0086223483085632e-05, 1.0567717254161835e-05, 1.1049211025238037e-05, 1.153070479631424e-05, 1.2012198567390442e-05, 1.2493692338466644e-05, 1.2975186109542847e-05, 1.3456679880619049e-05, 1.3938173651695251e-05, 1.4419667422771454e-05, 1.4901161193847656e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 2.0, 9.0, 10.0, 12.0, 22.0, 30.0, 34.0, 56.0, 80.0, 123.0, 199.0, 322.0, 608.0, 1179.0, 2642.0, 7807.0, 50348.0, 902887.0, 67310.0, 9249.0, 2862.0, 1219.0, 597.0, 360.0, 187.0, 117.0, 81.0, 47.0, 38.0, 24.0, 18.0, 19.0, 11.0, 9.0, 9.0, 10.0, 8.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.024383544921875, -0.023529529571533203, -0.022675514221191406, -0.02182149887084961, -0.020967483520507812, -0.020113468170166016, -0.01925945281982422, -0.018405437469482422, -0.017551422119140625, -0.016697406768798828, -0.01584339141845703, -0.014989376068115234, -0.014135360717773438, -0.01328134536743164, -0.012427330017089844, -0.011573314666748047, -0.01071929931640625, -0.009865283966064453, -0.009011268615722656, -0.00815725326538086, -0.0073032379150390625, -0.006449222564697266, -0.005595207214355469, -0.004741191864013672, -0.003887176513671875, -0.003033161163330078, -0.0021791458129882812, -0.0013251304626464844, -0.0004711151123046875, 0.0003829002380371094, 0.0012369155883789062, 0.002090930938720703, 0.0029449462890625, 0.003798961639404297, 0.004652976989746094, 0.005506992340087891, 0.0063610076904296875, 0.007215023040771484, 0.008069038391113281, 0.008923053741455078, 0.009777069091796875, 0.010631084442138672, 0.011485099792480469, 0.012339115142822266, 0.013193130493164062, 0.01404714584350586, 0.014901161193847656, 0.015755176544189453, 0.01660919189453125, 0.017463207244873047, 0.018317222595214844, 0.01917123794555664, 0.020025253295898438, 0.020879268646240234, 0.02173328399658203, 0.022587299346923828, 0.023441314697265625, 0.024295330047607422, 0.02514934539794922, 0.026003360748291016, 0.026857376098632812, 0.02771139144897461, 0.028565406799316406, 0.029419422149658203, 0.0302734375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 2.0, 7.0, 6.0, 4.0, 4.0, 10.0, 9.0, 21.0, 16.0, 31.0, 30.0, 47.0, 52.0, 79.0, 62.0, 91.0, 77.0, 78.0, 62.0, 68.0, 52.0, 40.0, 33.0, 20.0, 20.0, 13.0, 11.0, 8.0, 2.0, 8.0, 6.0, 5.0, 2.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.026611328125, -0.02567911148071289, -0.02474689483642578, -0.023814678192138672, -0.022882461547851562, -0.021950244903564453, -0.021018028259277344, -0.020085811614990234, -0.019153594970703125, -0.018221378326416016, -0.017289161682128906, -0.016356945037841797, -0.015424728393554688, -0.014492511749267578, -0.013560295104980469, -0.01262807846069336, -0.01169586181640625, -0.01076364517211914, -0.009831428527832031, -0.008899211883544922, -0.007966995239257812, -0.007034778594970703, -0.006102561950683594, -0.005170345306396484, -0.004238128662109375, -0.0033059120178222656, -0.0023736953735351562, -0.0014414787292480469, -0.0005092620849609375, 0.0004229545593261719, 0.0013551712036132812, 0.0022873878479003906, 0.0032196044921875, 0.004151821136474609, 0.005084037780761719, 0.006016254425048828, 0.0069484710693359375, 0.007880687713623047, 0.008812904357910156, 0.009745121002197266, 0.010677337646484375, 0.011609554290771484, 0.012541770935058594, 0.013473987579345703, 0.014406204223632812, 0.015338420867919922, 0.01627063751220703, 0.01720285415649414, 0.01813507080078125, 0.01906728744506836, 0.01999950408935547, 0.020931720733642578, 0.021863937377929688, 0.022796154022216797, 0.023728370666503906, 0.024660587310791016, 0.025592803955078125, 0.026525020599365234, 0.027457237243652344, 0.028389453887939453, 0.029321670532226562, 0.030253887176513672, 0.03118610382080078, 0.03211832046508789, 0.033050537109375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 11.0, 23.0, 59.0, 199.0, 409.0, 150.0, 70.0, 31.0, 21.0, 13.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7281779050827026, -0.6901884078979492, -0.6521989107131958, -0.6142094135284424, -0.5762198567390442, -0.5382303595542908, -0.5002408623695374, -0.46225133538246155, -0.42426183819770813, -0.3862723410129547, -0.3482828140258789, -0.3102933168411255, -0.27230381965637207, -0.23431429266929626, -0.19632479548454285, -0.15833526849746704, -0.12034577131271362, -0.08235625922679901, -0.044366754591464996, -0.0063772499561309814, 0.03161226212978363, 0.06960177421569824, 0.10759127140045166, 0.14558079838752747, 0.18357029557228088, 0.2215598076581955, 0.2595493197441101, 0.2975388169288635, 0.33552831411361694, 0.37351784110069275, 0.41150733828544617, 0.449496865272522, 0.4874863624572754, 0.5254758596420288, 0.5634653568267822, 0.6014548540115356, 0.6394444108009338, 0.6774339079856873, 0.7154234051704407, 0.7534129619598389, 0.7914024591445923, 0.8293919563293457, 0.8673814535140991, 0.9053709506988525, 0.9433605074882507, 0.9813500046730042, 1.0193395614624023, 1.0573290586471558, 1.0953185558319092, 1.1333080530166626, 1.171297550201416, 1.2092870473861694, 1.2472765445709229, 1.2852661609649658, 1.3232555389404297, 1.3612451553344727, 1.3992345333099365, 1.43722403049469, 1.4752135276794434, 1.5132030248641968, 1.5511925220489502, 1.5891821384429932, 1.627171516418457, 1.6651611328125, 1.7031506299972534]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 6.0, 4.0, 6.0, 9.0, 11.0, 10.0, 17.0, 9.0, 18.0, 19.0, 28.0, 19.0, 22.0, 40.0, 48.0, 80.0, 108.0, 128.0, 88.0, 54.0, 34.0, 32.0, 34.0, 29.0, 32.0, 21.0, 14.0, 19.0, 10.0, 6.0, 11.0, 8.0, 3.0, 4.0, 1.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130406379699707, -1.0927250385284424, -1.0550438165664673, -1.0173624753952026, -0.9796812534332275, -0.9419999718666077, -0.9043186902999878, -0.8666373491287231, -0.828956127166748, -0.7912748456001282, -0.7535935640335083, -0.7159122824668884, -0.6782310009002686, -0.6405497193336487, -0.6028684377670288, -0.5651870965957642, -0.5275058150291443, -0.4898245334625244, -0.45214325189590454, -0.41446197032928467, -0.3767806887626648, -0.3390994071960449, -0.30141809582710266, -0.2637368142604828, -0.22605553269386292, -0.18837425112724304, -0.15069296956062317, -0.1130116730928421, -0.07533039152622223, -0.037649109959602356, 3.218650817871094e-05, 0.037713468074798584, 0.07539474964141846, 0.11307603120803833, 0.1507573127746582, 0.18843860924243927, 0.22611989080905914, 0.2638011574745178, 0.3014824688434601, 0.33916375041007996, 0.37684503197669983, 0.4145263135433197, 0.4522075951099396, 0.48988890647888184, 0.5275701880455017, 0.5652514696121216, 0.6029327511787415, 0.6406140327453613, 0.6782953143119812, 0.7159765958786011, 0.753657877445221, 0.7913391590118408, 0.8290204405784607, 0.8667017221450806, 0.9043830633163452, 0.9420642852783203, 0.979745626449585, 1.0174269676208496, 1.0551081895828247, 1.0927895307540894, 1.1304707527160645, 1.168152093887329, 1.2058333158493042, 1.2435146570205688, 1.281195878982544]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 2.0, 5.0, 7.0, 7.0, 8.0, 7.0, 15.0, 16.0, 19.0, 20.0, 32.0, 52.0, 77.0, 107.0, 260.0, 390.0, 916.0, 3577.0, 16675.0, 91636.0, 1872373.0, 2114122.0, 72179.0, 13955.0, 4996.0, 1492.0, 500.0, 257.0, 186.0, 113.0, 66.0, 64.0, 40.0, 25.0, 17.0, 12.0, 13.0, 11.0, 7.0, 9.0, 3.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1373291015625, -0.13316917419433594, -0.12900924682617188, -0.12484931945800781, -0.12068939208984375, -0.11652946472167969, -0.11236953735351562, -0.10820960998535156, -0.1040496826171875, -0.09988975524902344, -0.09572982788085938, -0.09156990051269531, -0.08740997314453125, -0.08325004577636719, -0.07909011840820312, -0.07493019104003906, -0.070770263671875, -0.06661033630371094, -0.062450408935546875, -0.05829048156738281, -0.05413055419921875, -0.04997062683105469, -0.045810699462890625, -0.04165077209472656, -0.0374908447265625, -0.03333091735839844, -0.029170989990234375, -0.025011062622070312, -0.02085113525390625, -0.016691207885742188, -0.012531280517578125, -0.008371353149414062, -0.00421142578125, -5.14984130859375e-05, 0.004108428955078125, 0.008268356323242188, 0.01242828369140625, 0.016588211059570312, 0.020748138427734375, 0.024908065795898438, 0.0290679931640625, 0.03322792053222656, 0.037387847900390625, 0.04154777526855469, 0.04570770263671875, 0.04986763000488281, 0.054027557373046875, 0.05818748474121094, 0.062347412109375, 0.06650733947753906, 0.07066726684570312, 0.07482719421386719, 0.07898712158203125, 0.08314704895019531, 0.08730697631835938, 0.09146690368652344, 0.0956268310546875, 0.09978675842285156, 0.10394668579101562, 0.10810661315917969, 0.11226654052734375, 0.11642646789550781, 0.12058639526367188, 0.12474632263183594, 0.12890625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 15.0, 16.0, 28.0, 39.0, 41.0, 67.0, 75.0, 92.0, 114.0, 102.0, 98.0, 68.0, 67.0, 50.0, 33.0, 31.0, 19.0, 8.0, 7.0, 10.0, 6.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1551513671875, -0.1506175994873047, -0.14608383178710938, -0.14155006408691406, -0.13701629638671875, -0.13248252868652344, -0.12794876098632812, -0.12341499328613281, -0.1188812255859375, -0.11434745788574219, -0.10981369018554688, -0.10527992248535156, -0.10074615478515625, -0.09621238708496094, -0.09167861938476562, -0.08714485168457031, -0.082611083984375, -0.07807731628417969, -0.07354354858398438, -0.06900978088378906, -0.06447601318359375, -0.05994224548339844, -0.055408477783203125, -0.05087471008300781, -0.0463409423828125, -0.04180717468261719, -0.037273406982421875, -0.03273963928222656, -0.02820587158203125, -0.023672103881835938, -0.019138336181640625, -0.014604568481445312, -0.01007080078125, -0.0055370330810546875, -0.001003265380859375, 0.0035305023193359375, 0.00806427001953125, 0.012598037719726562, 0.017131805419921875, 0.021665573120117188, 0.0261993408203125, 0.030733108520507812, 0.035266876220703125, 0.03980064392089844, 0.04433441162109375, 0.04886817932128906, 0.053401947021484375, 0.05793571472167969, 0.062469482421875, 0.06700325012207031, 0.07153701782226562, 0.07607078552246094, 0.08060455322265625, 0.08513832092285156, 0.08967208862304688, 0.09420585632324219, 0.0987396240234375, 0.10327339172363281, 0.10780715942382812, 0.11234092712402344, 0.11687469482421875, 0.12140846252441406, 0.12594223022460938, 0.1304759979248047, 0.135009765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 7.0, 11.0, 13.0, 16.0, 20.0, 32.0, 35.0, 57.0, 81.0, 159.0, 261.0, 528.0, 1434.0, 6520.0, 1030193.0, 3142844.0, 8868.0, 1757.0, 661.0, 316.0, 141.0, 110.0, 53.0, 42.0, 37.0, 20.0, 16.0, 9.0, 7.0, 6.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.39697265625, -0.385955810546875, -0.37493896484375, -0.363922119140625, -0.3529052734375, -0.341888427734375, -0.33087158203125, -0.319854736328125, -0.308837890625, -0.297821044921875, -0.28680419921875, -0.275787353515625, -0.2647705078125, -0.253753662109375, -0.24273681640625, -0.231719970703125, -0.220703125, -0.209686279296875, -0.19866943359375, -0.187652587890625, -0.1766357421875, -0.165618896484375, -0.15460205078125, -0.143585205078125, -0.132568359375, -0.121551513671875, -0.11053466796875, -0.099517822265625, -0.0885009765625, -0.077484130859375, -0.06646728515625, -0.055450439453125, -0.04443359375, -0.033416748046875, -0.02239990234375, -0.011383056640625, -0.0003662109375, 0.010650634765625, 0.02166748046875, 0.032684326171875, 0.043701171875, 0.054718017578125, 0.06573486328125, 0.076751708984375, 0.0877685546875, 0.098785400390625, 0.10980224609375, 0.120819091796875, 0.1318359375, 0.142852783203125, 0.15386962890625, 0.164886474609375, 0.1759033203125, 0.186920166015625, 0.19793701171875, 0.208953857421875, 0.219970703125, 0.230987548828125, 0.24200439453125, 0.253021240234375, 0.2640380859375, 0.275054931640625, 0.28607177734375, 0.297088623046875, 0.30810546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 4.0, 18.0, 26.0, 23.0, 31.0, 41.0, 76.0, 131.0, 214.0, 418.0, 881.0, 978.0, 492.0, 271.0, 135.0, 83.0, 71.0, 42.0, 24.0, 18.0, 22.0, 12.0, 11.0, 7.0, 2.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17578125, -0.16812515258789062, -0.16046905517578125, -0.15281295776367188, -0.1451568603515625, -0.13750076293945312, -0.12984466552734375, -0.12218856811523438, -0.114532470703125, -0.10687637329101562, -0.09922027587890625, -0.09156417846679688, -0.0839080810546875, -0.07625198364257812, -0.06859588623046875, -0.060939788818359375, -0.05328369140625, -0.045627593994140625, -0.03797149658203125, -0.030315399169921875, -0.0226593017578125, -0.015003204345703125, -0.00734710693359375, 0.000308990478515625, 0.007965087890625, 0.015621185302734375, 0.02327728271484375, 0.030933380126953125, 0.0385894775390625, 0.046245574951171875, 0.05390167236328125, 0.061557769775390625, 0.0692138671875, 0.07686996459960938, 0.08452606201171875, 0.09218215942382812, 0.0998382568359375, 0.10749435424804688, 0.11515045166015625, 0.12280654907226562, 0.130462646484375, 0.13811874389648438, 0.14577484130859375, 0.15343093872070312, 0.1610870361328125, 0.16874313354492188, 0.17639923095703125, 0.18405532836914062, 0.19171142578125, 0.19936752319335938, 0.20702362060546875, 0.21467971801757812, 0.2223358154296875, 0.22999191284179688, 0.23764801025390625, 0.24530410766601562, 0.252960205078125, 0.2606163024902344, 0.26827239990234375, 0.2759284973144531, 0.2835845947265625, 0.2912406921386719, 0.29889678955078125, 0.3065528869628906, 0.314208984375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 1.0, 2.0, 5.0, 4.0, 24.0, 30.0, 41.0, 79.0, 170.0, 273.0, 140.0, 96.0, 58.0, 24.0, 20.0, 13.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.142827033996582, -1.086534023284912, -1.0302411317825317, -0.9739481210708618, -0.9176551103591919, -0.8613621592521667, -0.8050692081451416, -0.7487761974334717, -0.6924832463264465, -0.6361902952194214, -0.5798972845077515, -0.5236043334007263, -0.4673113524913788, -0.41101837158203125, -0.3547254204750061, -0.29843243956565857, -0.24213945865631104, -0.1858464777469635, -0.12955351173877716, -0.07326054573059082, -0.016967564821243286, 0.03932541608810425, 0.0956183671951294, 0.15191134810447693, 0.20820432901382446, 0.264497309923172, 0.32079029083251953, 0.3770832419395447, 0.4333762228488922, 0.48966920375823975, 0.5459621548652649, 0.60225510597229, 0.65854811668396, 0.7148410677909851, 0.771134078502655, 0.8274270296096802, 0.8837200403213501, 0.9400129914283752, 0.9963059425354004, 1.0525989532470703, 1.1088919639587402, 1.1651849746704102, 1.2214778661727905, 1.2777708768844604, 1.3340638875961304, 1.3903567790985107, 1.4466497898101807, 1.5029428005218506, 1.559235692024231, 1.6155287027359009, 1.6718215942382812, 1.7281146049499512, 1.784407615661621, 1.840700626373291, 1.8969935178756714, 1.9532865285873413, 2.0095794200897217, 2.0658724308013916, 2.1221654415130615, 2.1784582138061523, 2.2347512245178223, 2.291044235229492, 2.347337245941162, 2.403630256652832, 2.459923267364502]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 5.0, 6.0, 6.0, 3.0, 6.0, 9.0, 13.0, 13.0, 15.0, 27.0, 32.0, 38.0, 36.0, 38.0, 52.0, 49.0, 58.0, 60.0, 80.0, 69.0, 61.0, 65.0, 57.0, 49.0, 30.0, 28.0, 34.0, 19.0, 15.0, 10.0, 9.0, 8.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5701770782470703, -1.514647126197815, -1.4591171741485596, -1.4035873413085938, -1.3480573892593384, -1.292527437210083, -1.2369976043701172, -1.1814676523208618, -1.1259377002716064, -1.070407748222351, -1.0148777961730957, -0.9593479633331299, -0.9038180112838745, -0.8482880592346191, -0.7927581667900085, -0.737228274345398, -0.6816983222961426, -0.6261683702468872, -0.5706384778022766, -0.515108585357666, -0.45957863330841064, -0.40404871106147766, -0.3485187888145447, -0.2929888665676117, -0.2374589443206787, -0.18192902207374573, -0.12639909982681274, -0.07086917757987976, -0.015339255332946777, 0.040190666913986206, 0.09572058916091919, 0.15125051140785217, 0.20678043365478516, 0.26231035590171814, 0.3178402781486511, 0.3733702003955841, 0.4289001226425171, 0.4844300448894501, 0.5399599671363831, 0.5954898595809937, 0.651019811630249, 0.7065497636795044, 0.762079656124115, 0.8176095485687256, 0.873139500617981, 0.9286694526672363, 0.9841993451118469, 1.0397292375564575, 1.095259189605713, 1.1507891416549683, 1.2063190937042236, 1.2618489265441895, 1.3173788785934448, 1.3729088306427002, 1.428438663482666, 1.4839686155319214, 1.5394985675811768, 1.5950285196304321, 1.6505584716796875, 1.7060883045196533, 1.7616182565689087, 1.817148208618164, 1.8726780414581299, 1.9282079935073853, 1.9837379455566406]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 9.0, 14.0, 20.0, 32.0, 56.0, 85.0, 144.0, 230.0, 448.0, 961.0, 2031.0, 6036.0, 22475.0, 162403.0, 757050.0, 75598.0, 13856.0, 4013.0, 1526.0, 670.0, 341.0, 185.0, 133.0, 76.0, 42.0, 30.0, 27.0, 16.0, 12.0, 12.0, 7.0, 5.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.18359375, -0.1789264678955078, -0.17425918579101562, -0.16959190368652344, -0.16492462158203125, -0.16025733947753906, -0.15559005737304688, -0.1509227752685547, -0.1462554931640625, -0.1415882110595703, -0.13692092895507812, -0.13225364685058594, -0.12758636474609375, -0.12291908264160156, -0.11825180053710938, -0.11358451843261719, -0.108917236328125, -0.10424995422363281, -0.09958267211914062, -0.09491539001464844, -0.09024810791015625, -0.08558082580566406, -0.08091354370117188, -0.07624626159667969, -0.0715789794921875, -0.06691169738769531, -0.062244415283203125, -0.05757713317871094, -0.05290985107421875, -0.04824256896972656, -0.043575286865234375, -0.03890800476074219, -0.03424072265625, -0.029573440551757812, -0.024906158447265625, -0.020238876342773438, -0.01557159423828125, -0.010904312133789062, -0.006237030029296875, -0.0015697479248046875, 0.0030975341796875, 0.0077648162841796875, 0.012432098388671875, 0.017099380493164062, 0.02176666259765625, 0.026433944702148438, 0.031101226806640625, 0.03576850891113281, 0.040435791015625, 0.04510307312011719, 0.049770355224609375, 0.05443763732910156, 0.05910491943359375, 0.06377220153808594, 0.06843948364257812, 0.07310676574707031, 0.0777740478515625, 0.08244132995605469, 0.08710861206054688, 0.09177589416503906, 0.09644317626953125, 0.10111045837402344, 0.10577774047851562, 0.11044502258300781, 0.1151123046875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 9.0, 6.0, 8.0, 25.0, 37.0, 50.0, 70.0, 84.0, 95.0, 109.0, 92.0, 91.0, 92.0, 71.0, 46.0, 43.0, 26.0, 14.0, 16.0, 4.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1678466796875, -0.16211700439453125, -0.1563873291015625, -0.15065765380859375, -0.144927978515625, -0.13919830322265625, -0.1334686279296875, -0.12773895263671875, -0.12200927734375, -0.11627960205078125, -0.1105499267578125, -0.10482025146484375, -0.099090576171875, -0.09336090087890625, -0.0876312255859375, -0.08190155029296875, -0.076171875, -0.07044219970703125, -0.0647125244140625, -0.05898284912109375, -0.053253173828125, -0.04752349853515625, -0.0417938232421875, -0.03606414794921875, -0.03033447265625, -0.02460479736328125, -0.0188751220703125, -0.01314544677734375, -0.007415771484375, -0.00168609619140625, 0.0040435791015625, 0.00977325439453125, 0.0155029296875, 0.02123260498046875, 0.0269622802734375, 0.03269195556640625, 0.038421630859375, 0.04415130615234375, 0.0498809814453125, 0.05561065673828125, 0.06134033203125, 0.06707000732421875, 0.0727996826171875, 0.07852935791015625, 0.084259033203125, 0.08998870849609375, 0.0957183837890625, 0.10144805908203125, 0.107177734375, 0.11290740966796875, 0.1186370849609375, 0.12436676025390625, 0.130096435546875, 0.13582611083984375, 0.1415557861328125, 0.14728546142578125, 0.15301513671875, 0.15874481201171875, 0.1644744873046875, 0.17020416259765625, 0.175933837890625, 0.18166351318359375, 0.1873931884765625, 0.19312286376953125, 0.1988525390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 6.0, 9.0, 16.0, 12.0, 15.0, 19.0, 32.0, 47.0, 91.0, 145.0, 267.0, 510.0, 1147.0, 3718.0, 25744.0, 940385.0, 67305.0, 6081.0, 1604.0, 623.0, 294.0, 176.0, 83.0, 68.0, 36.0, 32.0, 16.0, 18.0, 13.0, 8.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1885986328125, -0.18201828002929688, -0.17543792724609375, -0.16885757446289062, -0.1622772216796875, -0.15569686889648438, -0.14911651611328125, -0.14253616333007812, -0.135955810546875, -0.12937545776367188, -0.12279510498046875, -0.11621475219726562, -0.1096343994140625, -0.10305404663085938, -0.09647369384765625, -0.08989334106445312, -0.08331298828125, -0.07673263549804688, -0.07015228271484375, -0.06357192993164062, -0.0569915771484375, -0.050411224365234375, -0.04383087158203125, -0.037250518798828125, -0.030670166015625, -0.024089813232421875, -0.01750946044921875, -0.010929107666015625, -0.0043487548828125, 0.002231597900390625, 0.00881195068359375, 0.015392303466796875, 0.02197265625, 0.028553009033203125, 0.03513336181640625, 0.041713714599609375, 0.0482940673828125, 0.054874420166015625, 0.06145477294921875, 0.06803512573242188, 0.074615478515625, 0.08119583129882812, 0.08777618408203125, 0.09435653686523438, 0.1009368896484375, 0.10751724243164062, 0.11409759521484375, 0.12067794799804688, 0.12725830078125, 0.13383865356445312, 0.14041900634765625, 0.14699935913085938, 0.1535797119140625, 0.16016006469726562, 0.16674041748046875, 0.17332077026367188, 0.179901123046875, 0.18648147583007812, 0.19306182861328125, 0.19964218139648438, 0.2062225341796875, 0.21280288696289062, 0.21938323974609375, 0.22596359252929688, 0.2325439453125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 8.0, 5.0, 15.0, 14.0, 13.0, 20.0, 21.0, 24.0, 37.0, 29.0, 51.0, 43.0, 59.0, 71.0, 64.0, 79.0, 74.0, 57.0, 52.0, 41.0, 34.0, 28.0, 19.0, 13.0, 15.0, 22.0, 20.0, 20.0, 11.0, 4.0, 2.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.376220703125, -0.36371612548828125, -0.3512115478515625, -0.33870697021484375, -0.326202392578125, -0.31369781494140625, -0.3011932373046875, -0.28868865966796875, -0.27618408203125, -0.26367950439453125, -0.2511749267578125, -0.23867034912109375, -0.226165771484375, -0.21366119384765625, -0.2011566162109375, -0.18865203857421875, -0.1761474609375, -0.16364288330078125, -0.1511383056640625, -0.13863372802734375, -0.126129150390625, -0.11362457275390625, -0.1011199951171875, -0.08861541748046875, -0.07611083984375, -0.06360626220703125, -0.0511016845703125, -0.03859710693359375, -0.026092529296875, -0.01358795166015625, -0.0010833740234375, 0.01142120361328125, 0.02392578125, 0.03643035888671875, 0.0489349365234375, 0.06143951416015625, 0.073944091796875, 0.08644866943359375, 0.0989532470703125, 0.11145782470703125, 0.12396240234375, 0.13646697998046875, 0.1489715576171875, 0.16147613525390625, 0.173980712890625, 0.18648529052734375, 0.1989898681640625, 0.21149444580078125, 0.2239990234375, 0.23650360107421875, 0.2490081787109375, 0.26151275634765625, 0.274017333984375, 0.28652191162109375, 0.2990264892578125, 0.31153106689453125, 0.32403564453125, 0.33654022216796875, 0.3490447998046875, 0.36154937744140625, 0.374053955078125, 0.38655853271484375, 0.3990631103515625, 0.41156768798828125, 0.424072265625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 5.0, 11.0, 9.0, 19.0, 18.0, 24.0, 35.0, 43.0, 50.0, 70.0, 133.0, 231.0, 380.0, 621.0, 1202.0, 2653.0, 6973.0, 22429.0, 128428.0, 818860.0, 46512.0, 11802.0, 4199.0, 1738.0, 895.0, 446.0, 253.0, 163.0, 97.0, 64.0, 55.0, 24.0, 25.0, 17.0, 9.0, 13.0, 10.0, 5.0, 10.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01508331298828125, -0.01456749439239502, -0.014051675796508789, -0.013535857200622559, -0.013020038604736328, -0.012504220008850098, -0.011988401412963867, -0.011472582817077637, -0.010956764221191406, -0.010440945625305176, -0.009925127029418945, -0.009409308433532715, -0.008893489837646484, -0.008377671241760254, -0.007861852645874023, -0.007346034049987793, -0.0068302154541015625, -0.006314396858215332, -0.0057985782623291016, -0.005282759666442871, -0.004766941070556641, -0.00425112247467041, -0.0037353038787841797, -0.0032194852828979492, -0.0027036666870117188, -0.0021878480911254883, -0.0016720294952392578, -0.0011562108993530273, -0.0006403923034667969, -0.0001245737075805664, 0.00039124488830566406, 0.0009070634841918945, 0.001422882080078125, 0.0019387006759643555, 0.002454519271850586, 0.0029703378677368164, 0.003486156463623047, 0.004001975059509277, 0.004517793655395508, 0.005033612251281738, 0.005549430847167969, 0.006065249443054199, 0.00658106803894043, 0.00709688663482666, 0.007612705230712891, 0.008128523826599121, 0.008644342422485352, 0.009160161018371582, 0.009675979614257812, 0.010191798210144043, 0.010707616806030273, 0.011223435401916504, 0.011739253997802734, 0.012255072593688965, 0.012770891189575195, 0.013286709785461426, 0.013802528381347656, 0.014318346977233887, 0.014834165573120117, 0.015349984169006348, 0.015865802764892578, 0.01638162136077881, 0.01689743995666504, 0.01741325855255127, 0.0179290771484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 8.0, 5.0, 4.0, 12.0, 9.0, 6.0, 14.0, 9.0, 28.0, 25.0, 36.0, 45.0, 53.0, 63.0, 69.0, 59.0, 65.0, 40.0, 88.0, 65.0, 56.0, 51.0, 46.0, 40.0, 22.0, 22.0, 14.0, 12.0, 8.0, 8.0, 10.0, 8.0, 2.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-06, -5.189329385757446e-06, -5.014240741729736e-06, -4.839152097702026e-06, -4.664063453674316e-06, -4.4889748096466064e-06, -4.3138861656188965e-06, -4.1387975215911865e-06, -3.9637088775634766e-06, -3.7886202335357666e-06, -3.6135315895080566e-06, -3.4384429454803467e-06, -3.2633543014526367e-06, -3.0882656574249268e-06, -2.913177013397217e-06, -2.738088369369507e-06, -2.562999725341797e-06, -2.387911081314087e-06, -2.212822437286377e-06, -2.037733793258667e-06, -1.862645149230957e-06, -1.687556505203247e-06, -1.5124678611755371e-06, -1.3373792171478271e-06, -1.1622905731201172e-06, -9.872019290924072e-07, -8.121132850646973e-07, -6.370246410369873e-07, -4.6193599700927734e-07, -2.868473529815674e-07, -1.1175870895385742e-07, 6.332993507385254e-08, 2.384185791015625e-07, 4.1350722312927246e-07, 5.885958671569824e-07, 7.636845111846924e-07, 9.387731552124023e-07, 1.1138617992401123e-06, 1.2889504432678223e-06, 1.4640390872955322e-06, 1.6391277313232422e-06, 1.8142163753509521e-06, 1.989305019378662e-06, 2.164393663406372e-06, 2.339482307434082e-06, 2.514570951461792e-06, 2.689659595489502e-06, 2.864748239517212e-06, 3.039836883544922e-06, 3.214925527572632e-06, 3.390014171600342e-06, 3.5651028156280518e-06, 3.7401914596557617e-06, 3.915280103683472e-06, 4.090368747711182e-06, 4.265457391738892e-06, 4.4405460357666016e-06, 4.6156346797943115e-06, 4.7907233238220215e-06, 4.9658119678497314e-06, 5.140900611877441e-06, 5.315989255905151e-06, 5.491077899932861e-06, 5.666166543960571e-06, 5.841255187988281e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 4.0, 5.0, 12.0, 10.0, 16.0, 24.0, 30.0, 35.0, 43.0, 67.0, 99.0, 148.0, 215.0, 401.0, 648.0, 1193.0, 2563.0, 6506.0, 22217.0, 120856.0, 813334.0, 57897.0, 13376.0, 4450.0, 1987.0, 942.0, 514.0, 321.0, 192.0, 114.0, 81.0, 61.0, 50.0, 32.0, 19.0, 14.0, 16.0, 11.0, 14.0, 8.0, 8.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0078277587890625, -0.007577776908874512, -0.0073277950286865234, -0.007077813148498535, -0.006827831268310547, -0.006577849388122559, -0.00632786750793457, -0.006077885627746582, -0.005827903747558594, -0.0055779218673706055, -0.005327939987182617, -0.005077958106994629, -0.004827976226806641, -0.004577994346618652, -0.004328012466430664, -0.004078030586242676, -0.0038280487060546875, -0.0035780668258666992, -0.003328084945678711, -0.0030781030654907227, -0.0028281211853027344, -0.002578139305114746, -0.002328157424926758, -0.0020781755447387695, -0.0018281936645507812, -0.001578211784362793, -0.0013282299041748047, -0.0010782480239868164, -0.0008282661437988281, -0.0005782842636108398, -0.00032830238342285156, -7.832050323486328e-05, 0.000171661376953125, 0.0004216432571411133, 0.0006716251373291016, 0.0009216070175170898, 0.0011715888977050781, 0.0014215707778930664, 0.0016715526580810547, 0.001921534538269043, 0.0021715164184570312, 0.0024214982986450195, 0.002671480178833008, 0.002921462059020996, 0.0031714439392089844, 0.0034214258193969727, 0.003671407699584961, 0.003921389579772949, 0.0041713714599609375, 0.004421353340148926, 0.004671335220336914, 0.004921317100524902, 0.005171298980712891, 0.005421280860900879, 0.005671262741088867, 0.0059212446212768555, 0.006171226501464844, 0.006421208381652832, 0.00667119026184082, 0.006921172142028809, 0.007171154022216797, 0.007421135902404785, 0.0076711177825927734, 0.007921099662780762, 0.00817108154296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 1.0, 5.0, 4.0, 9.0, 9.0, 8.0, 14.0, 16.0, 28.0, 41.0, 43.0, 84.0, 82.0, 97.0, 110.0, 95.0, 82.0, 66.0, 51.0, 35.0, 32.0, 36.0, 14.0, 7.0, 8.0, 6.0, 4.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.02850341796875, -0.02759718894958496, -0.026690959930419922, -0.025784730911254883, -0.024878501892089844, -0.023972272872924805, -0.023066043853759766, -0.022159814834594727, -0.021253585815429688, -0.02034735679626465, -0.01944112777709961, -0.01853489875793457, -0.01762866973876953, -0.016722440719604492, -0.015816211700439453, -0.014909982681274414, -0.014003753662109375, -0.013097524642944336, -0.012191295623779297, -0.011285066604614258, -0.010378837585449219, -0.00947260856628418, -0.00856637954711914, -0.0076601505279541016, -0.0067539215087890625, -0.0058476924896240234, -0.004941463470458984, -0.004035234451293945, -0.0031290054321289062, -0.002222776412963867, -0.0013165473937988281, -0.00041031837463378906, 0.00049591064453125, 0.001402139663696289, 0.002308368682861328, 0.003214597702026367, 0.004120826721191406, 0.005027055740356445, 0.005933284759521484, 0.0068395137786865234, 0.0077457427978515625, 0.008651971817016602, 0.00955820083618164, 0.01046442985534668, 0.011370658874511719, 0.012276887893676758, 0.013183116912841797, 0.014089345932006836, 0.014995574951171875, 0.015901803970336914, 0.016808032989501953, 0.017714262008666992, 0.01862049102783203, 0.01952672004699707, 0.02043294906616211, 0.02133917808532715, 0.022245407104492188, 0.023151636123657227, 0.024057865142822266, 0.024964094161987305, 0.025870323181152344, 0.026776552200317383, 0.027682781219482422, 0.02858901023864746, 0.0294952392578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 22.0, 36.0, 105.0, 450.0, 243.0, 81.0, 27.0, 24.0, 8.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0593338012695312, -2.0001823902130127, -1.9410309791564941, -1.8818795680999756, -1.822728157043457, -1.7635767459869385, -1.7044254541397095, -1.645274043083191, -1.5861226320266724, -1.5269712209701538, -1.4678198099136353, -1.4086683988571167, -1.3495171070098877, -1.2903656959533691, -1.2312142848968506, -1.172062873840332, -1.1129114627838135, -1.053760051727295, -0.9946086406707764, -0.9354572892189026, -0.876305878162384, -0.8171544671058655, -0.7580031156539917, -0.6988517045974731, -0.6397002935409546, -0.580548882484436, -0.5213974714279175, -0.4622461199760437, -0.40309470891952515, -0.3439432978630066, -0.2847919166088104, -0.22564053535461426, -0.1664891242980957, -0.10733772814273834, -0.04818633198738098, 0.01096506416797638, 0.07011646032333374, 0.1292678713798523, 0.18841925263404846, 0.24757063388824463, 0.3067220449447632, 0.36587345600128174, 0.4250248372554779, 0.4841762185096741, 0.5433276295661926, 0.6024790406227112, 0.661630392074585, 0.7207818031311035, 0.7799332141876221, 0.8390846252441406, 0.8982360363006592, 0.957387387752533, 1.0165388584136963, 1.0756902694702148, 1.1348415613174438, 1.1939929723739624, 1.253144383430481, 1.3122957944869995, 1.371447205543518, 1.4305986166000366, 1.4897499084472656, 1.5489013195037842, 1.6080527305603027, 1.6672041416168213, 1.7263555526733398]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 4.0, 6.0, 6.0, 9.0, 12.0, 11.0, 9.0, 15.0, 19.0, 19.0, 23.0, 24.0, 26.0, 31.0, 58.0, 145.0, 124.0, 117.0, 104.0, 44.0, 24.0, 29.0, 18.0, 16.0, 20.0, 16.0, 11.0, 13.0, 7.0, 9.0, 4.0, 4.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.002690315246582, -0.9651963114738464, -0.9277023673057556, -0.89020836353302, -0.8527144193649292, -0.8152204155921936, -0.777726411819458, -0.7402324676513672, -0.7027385234832764, -0.6652445197105408, -0.62775057554245, -0.5902565717697144, -0.5527626276016235, -0.5152686238288879, -0.47777464985847473, -0.4402806758880615, -0.4027866721153259, -0.3652926981449127, -0.3277987241744995, -0.2903047204017639, -0.2528107762336731, -0.2153167873620987, -0.1778227984905243, -0.14032882452011108, -0.10283485054969788, -0.06534087657928467, -0.027846895158290863, 0.009647086262702942, 0.04714106023311615, 0.08463503420352936, 0.12212902307510376, 0.15962299704551697, 0.19711697101593018, 0.23461094498634338, 0.2721049189567566, 0.3095989227294922, 0.347092866897583, 0.3845868706703186, 0.4220808446407318, 0.459574818611145, 0.4970687925815582, 0.5345627665519714, 0.572056770324707, 0.6095507144927979, 0.6470447182655334, 0.6845386624336243, 0.7220326662063599, 0.7595266103744507, 0.7970206141471863, 0.8345146179199219, 0.8720085620880127, 0.9095025658607483, 0.9469965100288391, 0.9844905138015747, 1.0219844579696655, 1.059478521347046, 1.0969724655151367, 1.1344664096832275, 1.171960473060608, 1.2094544172286987, 1.2469483613967896, 1.2844423055648804, 1.3219363689422607, 1.3594303131103516, 1.3969242572784424]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 8.0, 4.0, 6.0, 8.0, 7.0, 17.0, 17.0, 24.0, 23.0, 21.0, 31.0, 60.0, 64.0, 309.0, 153.0, 52.0, 50.0, 39.0, 32.0, 20.0, 14.0, 13.0, 8.0, 7.0, 3.0, 5.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08319091796875, -0.07970714569091797, -0.07622337341308594, -0.0727396011352539, -0.06925582885742188, -0.06577205657958984, -0.06228828430175781, -0.05880451202392578, -0.05532073974609375, -0.05183696746826172, -0.04835319519042969, -0.044869422912597656, -0.041385650634765625, -0.037901878356933594, -0.03441810607910156, -0.03093433380126953, -0.0274505615234375, -0.02396678924560547, -0.020483016967773438, -0.016999244689941406, -0.013515472412109375, -0.010031700134277344, -0.0065479278564453125, -0.0030641555786132812, 0.00041961669921875, 0.0039033889770507812, 0.0073871612548828125, 0.010870933532714844, 0.014354705810546875, 0.017838478088378906, 0.021322250366210938, 0.02480602264404297, 0.028289794921875, 0.03177356719970703, 0.03525733947753906, 0.038741111755371094, 0.042224884033203125, 0.045708656311035156, 0.04919242858886719, 0.05267620086669922, 0.05615997314453125, 0.05964374542236328, 0.06312751770019531, 0.06661128997802734, 0.07009506225585938, 0.0735788345336914, 0.07706260681152344, 0.08054637908935547, 0.0840301513671875, 0.08751392364501953, 0.09099769592285156, 0.0944814682006836, 0.09796524047851562, 0.10144901275634766, 0.10493278503417969, 0.10841655731201172, 0.11190032958984375, 0.11538410186767578, 0.11886787414550781, 0.12235164642333984, 0.12583541870117188, 0.1293191909790039, 0.13280296325683594, 0.13628673553466797, 0.1397705078125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 14.0, 12.0, 5.0, 10.0, 32.0, 29.0, 35.0, 89.0, 261.0, 904.0, 17378.0, 8366826.0, 2245.0, 378.0, 141.0, 67.0, 50.0, 20.0, 21.0, 20.0, 8.0, 3.0, 8.0, 6.0, 2.0, 1.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.024310827255249, -0.9952173233032227, -0.9661238193511963, -0.9370303153991699, -0.9079368114471436, -0.8788433074951172, -0.8497498035430908, -0.8206563591957092, -0.7915628552436829, -0.7624693512916565, -0.7333758473396301, -0.7042823433876038, -0.6751888394355774, -0.6460953950881958, -0.6170018911361694, -0.5879083871841431, -0.5588148832321167, -0.5297213792800903, -0.500627875328064, -0.4715343713760376, -0.4424408972263336, -0.41334739327430725, -0.3842538893222809, -0.3551604151725769, -0.32606685161590576, -0.2969733476638794, -0.267879843711853, -0.23878635466098785, -0.20969286561012268, -0.1805993616580963, -0.15150585770606995, -0.12241236865520477, -0.0933188796043396, -0.06422538310289383, -0.03513188287615776, -0.006038382649421692, 0.02305511385202408, 0.05214861035346985, 0.08124211430549622, 0.11033560335636139, 0.13942910730838776, 0.16852261126041412, 0.1976161003112793, 0.22670960426330566, 0.25580310821533203, 0.2848966121673584, 0.31399011611938477, 0.34308359026908875, 0.3721770942211151, 0.4012705981731415, 0.43036410212516785, 0.4594575762748718, 0.4885510802268982, 0.5176445841789246, 0.5467380881309509, 0.5758315920829773, 0.6049250960350037, 0.63401859998703, 0.6631121039390564, 0.6922056078910828, 0.7212991118431091, 0.7503925561904907, 0.7794860601425171, 0.8085795640945435, 0.8376730680465698]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 6.0, 1.0, 2.0, 6.0, 5.0, 3.0, 6.0, 7.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 3.0, 9.0, 3.0, 2.0, 2.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.31371912360191345, -0.30261167883872986, -0.2915042042732239, -0.2803967595100403, -0.2692893147468567, -0.2581818699836731, -0.24707439541816711, -0.23596695065498352, -0.22485949099063873, -0.21375203132629395, -0.20264458656311035, -0.19153712689876556, -0.18042966723442078, -0.16932222247123718, -0.1582147628068924, -0.1471073031425476, -0.135999858379364, -0.12489240616559982, -0.11378495395183563, -0.10267749428749084, -0.09157004207372665, -0.08046258985996246, -0.06935513019561768, -0.058247677981853485, -0.047140225768089294, -0.036032773554325104, -0.024925317615270615, -0.013817861676216125, -0.002710409462451935, 0.008397042751312256, 0.019504502415657043, 0.030611954629421234, 0.041719406843185425, 0.052826859056949615, 0.0639343112707138, 0.0750417709350586, 0.08614922314882278, 0.09725667536258698, 0.10836413502693176, 0.11947158724069595, 0.13057903945446014, 0.14168649911880493, 0.15279394388198853, 0.1639014035463333, 0.1750088632106781, 0.1861163079738617, 0.19722376763820648, 0.20833122730255127, 0.21943867206573486, 0.23054613173007965, 0.24165357649326324, 0.25276103615760803, 0.2638684809207916, 0.2749759554862976, 0.2860834002494812, 0.2971908450126648, 0.3082982897758484, 0.319405734539032, 0.33051320910453796, 0.34162065386772156, 0.35272809863090515, 0.36383557319641113, 0.3749430179595947, 0.3860504627227783, 0.3971579372882843]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 9.0, 3.0, 12.0, 16.0, 22.0, 36.0, 42.0, 54.0, 111.0, 159.0, 255.0, 427.0, 758.0, 1278.0, 2795.0, 5905.0, 13867.0, 36472.0, 105084.0, 195544.0, 100579.0, 35235.0, 13558.0, 5813.0, 2732.0, 1467.0, 812.0, 441.0, 248.0, 167.0, 109.0, 63.0, 50.0, 35.0, 31.0, 17.0, 19.0, 13.0, 13.0, 4.0, 3.0, 7.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.16552734375, -0.159027099609375, -0.15252685546875, -0.146026611328125, -0.1395263671875, -0.133026123046875, -0.12652587890625, -0.120025634765625, -0.113525390625, -0.107025146484375, -0.10052490234375, -0.094024658203125, -0.0875244140625, -0.081024169921875, -0.07452392578125, -0.068023681640625, -0.0615234375, -0.055023193359375, -0.04852294921875, -0.042022705078125, -0.0355224609375, -0.029022216796875, -0.02252197265625, -0.016021728515625, -0.009521484375, -0.003021240234375, 0.00347900390625, 0.009979248046875, 0.0164794921875, 0.022979736328125, 0.02947998046875, 0.035980224609375, 0.04248046875, 0.048980712890625, 0.05548095703125, 0.061981201171875, 0.0684814453125, 0.074981689453125, 0.08148193359375, 0.087982177734375, 0.094482421875, 0.100982666015625, 0.10748291015625, 0.113983154296875, 0.1204833984375, 0.126983642578125, 0.13348388671875, 0.139984130859375, 0.146484375, 0.152984619140625, 0.15948486328125, 0.165985107421875, 0.1724853515625, 0.178985595703125, 0.18548583984375, 0.191986083984375, 0.198486328125, 0.204986572265625, 0.21148681640625, 0.217987060546875, 0.2244873046875, 0.230987548828125, 0.23748779296875, 0.243988037109375, 0.25048828125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 12.0, 14.0, 20.0, 39.0, 40.0, 56.0, 100.0, 95.0, 114.0, 117.0, 102.0, 88.0, 56.0, 44.0, 28.0, 21.0, 12.0, 11.0, 6.0, 4.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16162109375, -0.15620040893554688, -0.15077972412109375, -0.14535903930664062, -0.1399383544921875, -0.13451766967773438, -0.12909698486328125, -0.12367630004882812, -0.118255615234375, -0.11283493041992188, -0.10741424560546875, -0.10199356079101562, -0.0965728759765625, -0.09115219116210938, -0.08573150634765625, -0.08031082153320312, -0.07489013671875, -0.06946945190429688, -0.06404876708984375, -0.058628082275390625, -0.0532073974609375, -0.047786712646484375, -0.04236602783203125, -0.036945343017578125, -0.031524658203125, -0.026103973388671875, -0.02068328857421875, -0.015262603759765625, -0.0098419189453125, -0.004421234130859375, 0.00099945068359375, 0.006420135498046875, 0.0118408203125, 0.017261505126953125, 0.02268218994140625, 0.028102874755859375, 0.0335235595703125, 0.038944244384765625, 0.04436492919921875, 0.049785614013671875, 0.055206298828125, 0.060626983642578125, 0.06604766845703125, 0.07146835327148438, 0.0768890380859375, 0.08230972290039062, 0.08773040771484375, 0.09315109252929688, 0.09857177734375, 0.10399246215820312, 0.10941314697265625, 0.11483383178710938, 0.1202545166015625, 0.12567520141601562, 0.13109588623046875, 0.13651657104492188, 0.141937255859375, 0.14735794067382812, 0.15277862548828125, 0.15819931030273438, 0.1636199951171875, 0.16904067993164062, 0.17446136474609375, 0.17988204956054688, 0.185302734375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 6.0, 14.0, 47.0, 105.0, 143.0, 78.0, 24.0, 10.0, 10.0, 9.0, 7.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7061334848403931, -0.6857825517654419, -0.6654316186904907, -0.6450806856155396, -0.6247297525405884, -0.6043788194656372, -0.584027886390686, -0.5636769533157349, -0.5433260202407837, -0.5229750871658325, -0.5026241540908813, -0.4822732210159302, -0.461922287940979, -0.44157135486602783, -0.42122045159339905, -0.4008695185184479, -0.3805186152458191, -0.3601676821708679, -0.33981674909591675, -0.3194658160209656, -0.2991148829460144, -0.27876394987106323, -0.25841304659843445, -0.23806211352348328, -0.2177111804485321, -0.19736024737358093, -0.17700931429862976, -0.15665839612483978, -0.1363074630498886, -0.11595652997493744, -0.09560560435056686, -0.07525467872619629, -0.05490374565124512, -0.034552816301584244, -0.01420188695192337, 0.006149042397737503, 0.026499971747398376, 0.04685090482234955, 0.06720183044672012, 0.0875527560710907, 0.10790368914604187, 0.12825462222099304, 0.1486055552959442, 0.1689564734697342, 0.18930740654468536, 0.20965833961963654, 0.2300092577934265, 0.2503601908683777, 0.27071112394332886, 0.29106205701828003, 0.3114129900932312, 0.3317639231681824, 0.35211485624313354, 0.3724657893180847, 0.3928166925907135, 0.4131676256656647, 0.43351855874061584, 0.453869491815567, 0.4742204248905182, 0.49457135796546936, 0.5149222612380981, 0.5352731943130493, 0.5556241273880005, 0.5759750604629517, 0.5963259935379028]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 11.0, 9.0, 26.0, 41.0, 94.0, 103.0, 89.0, 39.0, 18.0, 12.0, 3.0, 9.0, 4.0, 4.0, 3.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.2374911308288574, -1.206998348236084, -1.1765056848526, -1.1460129022598267, -1.1155202388763428, -1.0850274562835693, -1.0545347929000854, -1.024042010307312, -0.9935493469238281, -0.9630566239356995, -0.9325639009475708, -0.9020711779594421, -0.8715784549713135, -0.8410857319831848, -0.8105930089950562, -0.7801002264022827, -0.749607503414154, -0.7191147804260254, -0.6886220574378967, -0.6581293344497681, -0.6276366114616394, -0.5971438884735107, -0.5666511058807373, -0.5361584424972534, -0.50566565990448, -0.4751729369163513, -0.44468021392822266, -0.414187490940094, -0.38369476795196533, -0.35320204496383667, -0.3227092921733856, -0.29221656918525696, -0.2617238163948059, -0.23123109340667725, -0.20073837041854858, -0.17024563252925873, -0.13975290954113007, -0.1092601865530014, -0.07876744866371155, -0.048274725675582886, -0.017782002687454224, 0.012710724025964737, 0.0432034507393837, 0.07369618117809296, 0.10418890416622162, 0.13468162715435028, 0.16517436504364014, 0.1956670880317688, 0.22615981101989746, 0.2566525340080261, 0.2871452569961548, 0.31763797998428345, 0.3481307029724121, 0.37862342596054077, 0.4091161787509918, 0.4396089017391205, 0.47010162472724915, 0.5005943775177002, 0.5310871005058289, 0.5615798234939575, 0.5920725464820862, 0.6225652694702148, 0.6530579924583435, 0.6835507154464722, 0.7140434384346008]}, "eval/loss": 5.590612411499023, "eval/wer": 1.9976993256644189, "eval/runtime": 787.3401, "eval/samples_per_second": 3.356, "eval/steps_per_second": 0.281} \ No newline at end of file